Merge branch 'jk/git-tricks'
[git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
21 binmode STDOUT, ':utf8';
22
# Time at which this point of the script was reached, stored as the
# [seconds, microseconds] pair returned by Time::HiRes::gettimeofday().
our $t0 = [ gettimeofday() ];
# Counter of git commands run so far; evaluate_git_version() increments it
# (presumably every other place that runs git does too -- confirm in the
# rest of the file).
our $number_of_git_cmds = 0;

BEGIN {
        # Only when the MOD_PERL environment variable is set: ask CGI.pm to
        # compile its methods up front.
        CGI->compile() if $ENV{'MOD_PERL'};
}

# gitweb version string.  "++GIT_VERSION++" looks like a placeholder that is
# substituted when gitweb is built -- TODO confirm against the build scripts.
our $version = "++GIT_VERSION++";
31
32 our ($my_url, $my_uri, $base_url, $path_info, $home_link);
# Work out the URLs under which gitweb was reached and store them in the
# package globals $my_url, $my_uri, $base_url, $path_info and $home_link.
# Reads the request through the global $cgi object and the PATH_INFO and
# SCRIPT_NAME environment variables.
sub evaluate_uri {
        our $cgi;

        our $my_url = $cgi->url();
        our $my_uri = $cgi->url(-absolute => 1);

        # Relative URLs in gitweb ($logo, $favicon, ...) are resolved against
        # $base_url; it is needed and used only for URLs with nonempty PATH_INFO.
        our $base_url = $my_url;

        # When the script is used as DirectoryIndex, the URL does not contain
        # the name of the script file itself, and $cgi->url() fails to strip
        # PATH_INFO, so it is stripped by hand below.  $path_info is global
        # because it is also used later on.
        #
        # In the DirectoryIndex case $my_url is not the full script URL.  That
        # is good for generated links (they keep implying the script name when
        # the request did not spell it out), but it means $my_url cannot serve
        # as base URL.  So whenever PATH_INFO had to be stripped, the base URL
        # is rebuilt from the server base and SCRIPT_NAME.
        our $path_info = $ENV{"PATH_INFO"};
        if ($path_info) {
                my $trailing_path_info = qr{\Q$path_info\E$};

                # $my_uri is only touched when $my_url actually ended in PATH_INFO
                my $stripped_both = ($my_url =~ s/$trailing_path_info//)
                                 && ($my_uri =~ s/$trailing_path_info//);

                if ($stripped_both && defined $ENV{'SCRIPT_NAME'}) {
                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
                }
        }

        # target of the home link on top of all pages
        our $home_link = $my_uri || "/";
}
67
68 # core git executable to use
69 # this can just be "git" if your webserver has a sensible PATH
70 our $GIT = "++GIT_BINDIR++/git";
71
72 # absolute fs-path which will be prepended to the project path
73 #our $projectroot = "/pub/scm";
74 our $projectroot = "++GITWEB_PROJECTROOT++";
75
76 # fs traversing limit for getting project list
77 # the number is relative to the projectroot
78 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
79
80 # string of the home link on top of all pages
81 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
82
83 # name of your site or organization to appear in page titles
84 # replace this with something more descriptive for clearer bookmarks
85 our $site_name = "++GITWEB_SITENAME++"
86                  || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
87
88 # html snippet to include in the <head> section of each page
89 our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
90 # filename of html text to include at top of each page
91 our $site_header = "++GITWEB_SITE_HEADER++";
92 # html text to include at home page
93 our $home_text = "++GITWEB_HOMETEXT++";
94 # filename of html text to include at bottom of each page
95 our $site_footer = "++GITWEB_SITE_FOOTER++";
96
97 # URI of stylesheets
98 our @stylesheets = ("++GITWEB_CSS++");
99 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
100 our $stylesheet = undef;
101 # URI of GIT logo (72x27 size)
102 our $logo = "++GITWEB_LOGO++";
103 # URI of GIT favicon, assumed to be image/png type
104 our $favicon = "++GITWEB_FAVICON++";
105 # URI of gitweb.js (JavaScript code for gitweb)
106 our $javascript = "++GITWEB_JS++";
107
108 # URI and label (title) of GIT logo link
109 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
110 #our $logo_label = "git documentation";
111 our $logo_url = "http://git-scm.com/";
112 our $logo_label = "git homepage";
113
114 # source of projects list
115 our $projects_list = "++GITWEB_LIST++";
116
117 # the width (in characters) of the projects list "Description" column
118 our $projects_list_description_width = 25;
119
120 # group projects by category on the projects list
121 # (enabled if this variable evaluates to true)
122 our $projects_list_group_categories = 0;
123
124 # default category if none specified
125 # (leave the empty string for no category)
126 our $project_list_default_category = "";
127
128 # default order of projects list
129 # valid values are none, project, descr, owner, and age
130 our $default_projects_order = "project";
131
132 # show repository only if this file exists
133 # (only effective if this variable evaluates to true)
134 our $export_ok = "++GITWEB_EXPORT_OK++";
135
136 # show repository only if this subroutine returns true
137 # when given the path to the project, for example:
138 #    sub { return -e "$_[0]/git-daemon-export-ok"; }
139 our $export_auth_hook = undef;
140
141 # only allow viewing of repositories also shown on the overview page
142 our $strict_export = "++GITWEB_STRICT_EXPORT++";
143
144 # list of git base URLs used for URL to where fetch project from,
145 # i.e. full URL is "$git_base_url/$project"
146 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
147
148 # default blob_plain mimetype and default charset for text/plain blob
149 our $default_blob_plain_mimetype = 'text/plain';
150 our $default_text_plain_charset  = undef;
151
152 # file to use for guessing MIME types before trying /etc/mime.types
153 # (relative to the current git repository)
154 our $mimetypes_file = undef;
155
# assume this charset if a line contains non-UTF-8 characters;
# it should be a valid encoding (see Encode::Supported(3pm) for the list)
# in which every byte sequence is valid, for example
# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
# could even be 'utf-8' for the old behavior)
161 our $fallback_encoding = 'latin1';
162
163 # rename detection options for git-diff and git-diff-tree
164 # - default is '-M', with the cost proportional to
165 #   (number of removed files) * (number of new files).
166 # - more costly is '-C' (which implies '-M'), with the cost proportional to
167 #   (number of changed files + number of removed files) * (number of new files)
168 # - even more costly is '-C', '--find-copies-harder' with cost
169 #   (number of files in the original tree) * (number of new files)
170 # - one might want to include '-B' option, e.g. '-B', '-M'
171 our @diff_opts = ('-M'); # taken from git_commit
172
173 # Disables features that would allow repository owners to inject script into
174 # the gitweb domain.
175 our $prevent_xss = 0;
176
177 # Path to the highlight executable to use (must be the one from
178 # http://www.andre-simon.de due to assumptions about parameters and output).
179 # Useful if highlight is not installed on your webserver's PATH.
180 # [Default: highlight]
181 our $highlight_bin = "++HIGHLIGHT_BIN++";
182
183 # information about snapshot formats that gitweb is capable of serving
184 our %known_snapshot_formats = (
185         # name => {
186         #       'display' => display name,
187         #       'type' => mime type,
188         #       'suffix' => filename suffix,
189         #       'format' => --format for git-archive,
190         #       'compressor' => [compressor command and arguments]
191         #                       (array reference, optional)
192         #       'disabled' => boolean (optional)}
193         #
194         'tgz' => {
195                 'display' => 'tar.gz',
196                 'type' => 'application/x-gzip',
197                 'suffix' => '.tar.gz',
198                 'format' => 'tar',
199                 'compressor' => ['gzip', '-n']},
200
201         'tbz2' => {
202                 'display' => 'tar.bz2',
203                 'type' => 'application/x-bzip2',
204                 'suffix' => '.tar.bz2',
205                 'format' => 'tar',
206                 'compressor' => ['bzip2']},
207
208         'txz' => {
209                 'display' => 'tar.xz',
210                 'type' => 'application/x-xz',
211                 'suffix' => '.tar.xz',
212                 'format' => 'tar',
213                 'compressor' => ['xz'],
214                 'disabled' => 1},
215
216         'zip' => {
217                 'display' => 'zip',
218                 'type' => 'application/x-zip',
219                 'suffix' => '.zip',
220                 'format' => 'zip'},
221 );
222
223 # Aliases so we understand old gitweb.snapshot values in repository
224 # configuration.
225 our %known_snapshot_format_aliases = (
226         'gzip'  => 'tgz',
227         'bzip2' => 'tbz2',
228         'xz'    => 'txz',
229
230         # backward compatibility: legacy gitweb config support
231         'x-gzip' => undef, 'gz' => undef,
232         'x-bzip2' => undef, 'bz2' => undef,
233         'x-zip' => undef, '' => undef,
234 );
235
236 # Pixel sizes for icons and avatars. If the default font sizes or lineheights
237 # are changed, it may be appropriate to change these values too via
238 # $GITWEB_CONFIG.
239 our %avatar_size = (
240         'default' => 16,
241         'double'  => 32
242 );
243
# Used to set the maximum load at which we will still respond to gitweb queries.
# If the server load exceeds this value then return a "503 server busy" error.
# If gitweb cannot determine the server load, it is taken to be 0.
# Leave it undefined (or set to 'undef') to turn off load checking.
248 our $maxload = 300;
249
250 # configuration for 'highlight' (http://www.andre-simon.de/)
251 # match by basename
252 our %highlight_basename = (
253         #'Program' => 'py',
254         #'Library' => 'py',
255         'SConstruct' => 'py', # SCons equivalent of Makefile
256         'Makefile' => 'make',
257 );
258 # match by extension
# Maps a file extension to the name of the 'highlight' syntax to use for it.
#
# Every map() below is wrapped in its own parentheses on purpose: map is a
# list operator, so an unparenthesized map would take all the items that
# follow it (including the later map calls) as its input list, and the
# first, identity map would then turn every extension into a mapping to
# itself (e.g. 'h' => 'h' instead of 'h' => 'c').
our %highlight_ext = (
        # main extensions, defining name of syntax;
        # see files in /usr/share/highlight/langDefs/ directory
        (map { $_ => $_ }
                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make)),
        # alternate extensions, see /etc/highlight/filetypes.conf
        'h' => 'c',
        (map { $_ => 'sh'  } qw(bash zsh ksh)),
        (map { $_ => 'cpp' } qw(cxx c++ cc)),
        (map { $_ => 'php' } qw(php3 php4 php5 phps)),
        (map { $_ => 'pl'  } qw(perl pm)), # perhaps also 'cgi'
        (map { $_ => 'make'} qw(mak mk)),
        (map { $_ => 'xml' } qw(xhtml html htm)),
);
273
274 # You define site-wide feature defaults here; override them with
275 # $GITWEB_CONFIG as necessary.
276 our %feature = (
277         # feature => {
278         #       'sub' => feature-sub (subroutine),
279         #       'override' => allow-override (boolean),
280         #       'default' => [ default options...] (array reference)}
281         #
282         # if feature is overridable (it means that allow-override has true value),
283         # then feature-sub will be called with default options as parameters;
284         # return value of feature-sub indicates if to enable specified feature
285         #
286         # if there is no 'sub' key (no feature-sub), then feature cannot be
287         # overridden
288         #
289         # use gitweb_get_feature(<feature>) to retrieve the <feature> value
290         # (an array) or gitweb_check_feature(<feature>) to check if <feature>
291         # is enabled
292
293         # Enable the 'blame' blob view, showing the last commit that modified
294         # each line in the file. This can be very CPU-intensive.
295
296         # To enable system wide have in $GITWEB_CONFIG
297         # $feature{'blame'}{'default'} = [1];
298         # To have project specific config enable override in $GITWEB_CONFIG
299         # $feature{'blame'}{'override'} = 1;
300         # and in project config gitweb.blame = 0|1;
301         'blame' => {
302                 'sub' => sub { feature_bool('blame', @_) },
303                 'override' => 0,
304                 'default' => [0]},
305
        # Enable the 'snapshot' link, providing a compressed archive of any
        # tree. This can potentially generate high traffic if you have a large
        # project.
309
310         # Value is a list of formats defined in %known_snapshot_formats that
311         # you wish to offer.
312         # To disable system wide have in $GITWEB_CONFIG
313         # $feature{'snapshot'}{'default'} = [];
314         # To have project specific config enable override in $GITWEB_CONFIG
315         # $feature{'snapshot'}{'override'} = 1;
316         # and in project config, a comma-separated list of formats or "none"
317         # to disable.  Example: gitweb.snapshot = tbz2,zip;
318         'snapshot' => {
319                 'sub' => \&feature_snapshot,
320                 'override' => 0,
321                 'default' => ['tgz']},
322
323         # Enable text search, which will list the commits which match author,
324         # committer or commit text to a given string.  Enabled by default.
325         # Project specific override is not supported.
326         #
327         # Note that this controls all search features, which means that if
328         # it is disabled, then 'grep' and 'pickaxe' search would also be
329         # disabled.
330         'search' => {
331                 'override' => 0,
332                 'default' => [1]},
333
334         # Enable grep search, which will list the files in currently selected
335         # tree containing the given string. Enabled by default. This can be
336         # potentially CPU-intensive, of course.
337         # Note that you need to have 'search' feature enabled too.
338
339         # To enable system wide have in $GITWEB_CONFIG
340         # $feature{'grep'}{'default'} = [1];
341         # To have project specific config enable override in $GITWEB_CONFIG
342         # $feature{'grep'}{'override'} = 1;
343         # and in project config gitweb.grep = 0|1;
344         'grep' => {
345                 'sub' => sub { feature_bool('grep', @_) },
346                 'override' => 0,
347                 'default' => [1]},
348
349         # Enable the pickaxe search, which will list the commits that modified
350         # a given string in a file. This can be practical and quite faster
351         # alternative to 'blame', but still potentially CPU-intensive.
352         # Note that you need to have 'search' feature enabled too.
353
354         # To enable system wide have in $GITWEB_CONFIG
355         # $feature{'pickaxe'}{'default'} = [1];
356         # To have project specific config enable override in $GITWEB_CONFIG
357         # $feature{'pickaxe'}{'override'} = 1;
358         # and in project config gitweb.pickaxe = 0|1;
359         'pickaxe' => {
360                 'sub' => sub { feature_bool('pickaxe', @_) },
361                 'override' => 0,
362                 'default' => [1]},
363
        # Enable showing size of blobs in a 'tree' view, in a separate
        # column, similar to what 'ls -l' does.  This costs a bit of IO.
366
367         # To disable system wide have in $GITWEB_CONFIG
368         # $feature{'show-sizes'}{'default'} = [0];
369         # To have project specific config enable override in $GITWEB_CONFIG
370         # $feature{'show-sizes'}{'override'} = 1;
371         # and in project config gitweb.showsizes = 0|1;
372         'show-sizes' => {
373                 'sub' => sub { feature_bool('showsizes', @_) },
374                 'override' => 0,
375                 'default' => [1]},
376
377         # Make gitweb use an alternative format of the URLs which can be
378         # more readable and natural-looking: project name is embedded
379         # directly in the path and the query string contains other
380         # auxiliary information. All gitweb installations recognize
381         # URL in either format; this configures in which formats gitweb
382         # generates links.
383
384         # To enable system wide have in $GITWEB_CONFIG
385         # $feature{'pathinfo'}{'default'} = [1];
386         # Project specific override is not supported.
387
388         # Note that you will need to change the default location of CSS,
389         # favicon, logo and possibly other files to an absolute URL. Also,
390         # if gitweb.cgi serves as your indexfile, you will need to force
391         # $my_uri to contain the script name in your $GITWEB_CONFIG.
392         'pathinfo' => {
393                 'override' => 0,
394                 'default' => [0]},
395
396         # Make gitweb consider projects in project root subdirectories
397         # to be forks of existing projects. Given project $projname.git,
398         # projects matching $projname/*.git will not be shown in the main
399         # projects list, instead a '+' mark will be added to $projname
400         # there and a 'forks' view will be enabled for the project, listing
401         # all the forks. If project list is taken from a file, forks have
402         # to be listed after the main project.
403
404         # To enable system wide have in $GITWEB_CONFIG
405         # $feature{'forks'}{'default'} = [1];
406         # Project specific override is not supported.
407         'forks' => {
408                 'override' => 0,
409                 'default' => [0]},
410
411         # Insert custom links to the action bar of all project pages.
412         # This enables you mainly to link to third-party scripts integrating
413         # into gitweb; e.g. git-browser for graphical history representation
414         # or custom web-based repository administration interface.
415
416         # The 'default' value consists of a list of triplets in the form
417         # (label, link, position) where position is the label after which
418         # to insert the link and link is a format string where %n expands
419         # to the project name, %f to the project path within the filesystem,
420         # %h to the current hash (h gitweb parameter) and %b to the current
421         # hash base (hb gitweb parameter); %% expands to %.
422
423         # To enable system wide have in $GITWEB_CONFIG e.g.
424         # $feature{'actions'}{'default'} = [('graphiclog',
425         #       '/git-browser/by-commit.html?r=%n', 'summary')];
426         # Project specific override is not supported.
427         'actions' => {
428                 'override' => 0,
429                 'default' => []},
430
        # Allow gitweb to scan the project content tags of a project repository,
        # and display the popular Web 2.0-ish "tag cloud" near the projects
        # list.  Note that this is something COMPLETELY different from the
        # normal Git tags.
435
436         # gitweb by itself can show existing tags, but it does not handle
437         # tagging itself; you need to do it externally, outside gitweb.
438         # The format is described in git_get_project_ctags() subroutine.
439         # You may want to install the HTML::TagCloud Perl module to get
440         # a pretty tag cloud instead of just a list of tags.
441
442         # To enable system wide have in $GITWEB_CONFIG
443         # $feature{'ctags'}{'default'} = [1];
444         # Project specific override is not supported.
445
446         # In the future whether ctags editing is enabled might depend
447         # on the value, but using 1 should always mean no editing of ctags.
448         'ctags' => {
449                 'override' => 0,
450                 'default' => [0]},
451
452         # The maximum number of patches in a patchset generated in patch
453         # view. Set this to 0 or undef to disable patch view, or to a
454         # negative number to remove any limit.
455
456         # To disable system wide have in $GITWEB_CONFIG
457         # $feature{'patches'}{'default'} = [0];
458         # To have project specific config enable override in $GITWEB_CONFIG
459         # $feature{'patches'}{'override'} = 1;
460         # and in project config gitweb.patches = 0|n;
461         # where n is the maximum number of patches allowed in a patchset.
462         'patches' => {
463                 'sub' => \&feature_patches,
464                 'override' => 0,
465                 'default' => [16]},
466
467         # Avatar support. When this feature is enabled, views such as
468         # shortlog or commit will display an avatar associated with
469         # the email of the committer(s) and/or author(s).
470
471         # Currently available providers are gravatar and picon.
472         # If an unknown provider is specified, the feature is disabled.
473
474         # Gravatar depends on Digest::MD5.
475         # Picon currently relies on the indiana.edu database.
476
477         # To enable system wide have in $GITWEB_CONFIG
478         # $feature{'avatar'}{'default'} = ['<provider>'];
479         # where <provider> is either gravatar or picon.
480         # To have project specific config enable override in $GITWEB_CONFIG
481         # $feature{'avatar'}{'override'} = 1;
482         # and in project config gitweb.avatar = <provider>;
483         'avatar' => {
484                 'sub' => \&feature_avatar,
485                 'override' => 0,
486                 'default' => ['']},
487
488         # Enable displaying how much time and how many git commands
489         # it took to generate and display page.  Disabled by default.
490         # Project specific override is not supported.
491         'timed' => {
492                 'override' => 0,
493                 'default' => [0]},
494
495         # Enable turning some links into links to actions which require
496         # JavaScript to run (like 'blame_incremental').  Not enabled by
497         # default.  Project specific override is currently not supported.
498         'javascript-actions' => {
499                 'override' => 0,
500                 'default' => [0]},
501
502         # Enable and configure ability to change common timezone for dates
503         # in gitweb output via JavaScript.  Enabled by default.
504         # Project specific override is not supported.
505         'javascript-timezone' => {
506                 'override' => 0,
507                 'default' => [
508                         'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
509                                      # or undef to turn off this feature
510                         'gitweb_tz', # name of cookie where to store selected timezone
511                         'datetime',  # CSS class used to mark up dates for manipulation
512                 ]},
513
514         # Syntax highlighting support. This is based on Daniel Svensson's
515         # and Sham Chukoury's work in gitweb-xmms2.git.
516         # It requires the 'highlight' program present in $PATH,
517         # and therefore is disabled by default.
518
519         # To enable system wide have in $GITWEB_CONFIG
520         # $feature{'highlight'}{'default'} = [1];
521
522         'highlight' => {
523                 'sub' => sub { feature_bool('highlight', @_) },
524                 'override' => 0,
525                 'default' => [0]},
526
527         # Enable displaying of remote heads in the heads list
528
529         # To enable system wide have in $GITWEB_CONFIG
530         # $feature{'remote_heads'}{'default'} = [1];
531         # To have project specific config enable override in $GITWEB_CONFIG
532         # $feature{'remote_heads'}{'override'} = 1;
533         # and in project config gitweb.remote_heads = 0|1;
534         'remote_heads' => {
535                 'sub' => sub { feature_bool('remote_heads', @_) },
536                 'override' => 0,
537                 'default' => [0]},
538 );
539
# Return the list of option values for feature $name.
#
# Returns nothing when %feature has no entry for $name.  The configured
# defaults are returned unless the feature allows override AND a project is
# selected ($git_dir defined); in that case the feature's 'sub' is called with
# the defaults and its result is returned.  A feature that allows override but
# has no 'sub' produces a warning and falls back to the defaults.
sub gitweb_get_feature {
        my ($name) = @_;
        return unless exists $feature{$name};

        my $spec     = $feature{$name};
        my $sub      = $spec->{'sub'};
        my $override = $spec->{'override'};
        my @defaults = @{$spec->{'default'}};

        # project specific override is possible only if we have project
        our $git_dir; # global variable, declared later
        return @defaults
                unless $override && defined $git_dir;

        unless (defined $sub) {
                warn "feature $name is not overridable";
                return @defaults;
        }

        return $sub->(@defaults);
}
558
559 # A wrapper to check if a given feature is enabled.
560 # With this, you can say
561 #
562 #   my $bool_feat = gitweb_check_feature('bool_feat');
563 #   gitweb_check_feature('bool_feat') or somecode;
564 #
565 # instead of
566 #
567 #   my ($bool_feat) = gitweb_get_feature('bool_feat');
568 #   (gitweb_get_feature('bool_feat'))[0] or somecode;
569 #
sub gitweb_check_feature {
        # Only the first option value of the feature matters here; the list
        # slice yields nothing at all when the feature has no values.
        my @options = gitweb_get_feature(@_);
        return (@options)[0];
}
573
574
# Feature-sub helper for on/off features.
#
# $key is the project config key to look up (queried through
# git_get_project_config() with '--bool'); the remaining arguments are the
# feature's default options.  Returns the first default when the project
# config has no value, (1) for 'true' and (0) for 'false'.
sub feature_bool {
        my ($key, @defaults) = @_;
        my ($val) = git_get_project_config($key, '--bool');

        return ($defaults[0]) unless defined $val;
        return (1) if $val eq 'true';
        return (0) if $val eq 'false';
}
587
# Feature-sub for 'snapshot': the arguments are the default snapshot formats.
# A true value of the project config key 'snapshot' replaces them: 'none'
# yields an empty list, anything else is split on commas and/or whitespace.
sub feature_snapshot {
        my @fmts = @_;

        my ($val) = git_get_project_config('snapshot');

        # no (or false) project setting: keep the defaults
        return @fmts unless $val;

        @fmts = ();
        @fmts = split(/\s*[,\s]\s*/, $val) unless $val eq 'none';

        return @fmts;
}
599
# Feature-sub for 'patches': returns whatever the project config key
# 'patches' (queried with '--int') yields, or the first default option when
# the query yields nothing.
sub feature_patches {
        my @configured = git_get_project_config('patches', '--int');

        return @configured ? @configured : ($_[0]);
}
609
# Feature-sub for 'avatar': returns whatever the project config key 'avatar'
# yields, or all the default options when the query yields nothing.
sub feature_avatar {
        my @configured = git_get_project_config('avatar');

        return @configured if @configured;
        return @_;
}
615
616 # checking HEAD file with -e is fragile if the repository was
617 # initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
618 # and then pruned.
sub check_head_link {
        my ($dir) = @_;
        my $headfile = "$dir/HEAD";

        # usual case: $dir/HEAD exists (for a symlink, -e follows the link)
        my $head_exists = -e $headfile;
        return $head_exists if $head_exists;

        # otherwise accept a symlink HEAD whose target no longer exists,
        # as long as it points into refs/heads/
        return (-l $headfile && readlink($headfile) =~ /^refs\/heads\//);
}
625
# Decide whether the repository at $dir may be shown.  All of the following
# must hold:
#   - check_head_link($dir) is true;
#   - $export_ok is false, or the file "$dir/$export_ok" exists;
#   - $export_auth_hook is false, or it returns true when called with $dir.
sub check_export_ok {
        my ($dir) = @_;

        my $head_ok = check_head_link($dir);

        return ($head_ok
                && (!$export_ok || -e "$dir/$export_ok")
                && (!$export_auth_hook || $export_auth_hook->($dir)));
}
632
633 # process alternate names for backward compatibility
634 # filter out unsupported (unknown) snapshot formats
# Takes a list of snapshot format names and returns the usable ones:
#   1. names found in %known_snapshot_format_aliases are replaced by the
#      alias target;
#   2. names that are not keys of %known_snapshot_formats, or whose entry is
#      marked 'disabled', are dropped.
# Some legacy aliases map to undef.  Undefined names are filtered out
# explicitly so that they never reach a hash lookup, which would otherwise
# raise "uninitialized value" warnings.
sub filter_snapshot_fmts {
        my @fmts = @_;

        return grep {
                defined $_ &&
                exists $known_snapshot_formats{$_} &&
                !$known_snapshot_formats{$_}{'disabled'}
        } map {
                exists $known_snapshot_format_aliases{$_} ?
                       $known_snapshot_format_aliases{$_} : $_
        } grep { defined $_ } @fmts;
}
645
# If this is set to a code reference, that code is run once per request,
# which allows updating configuration that changes with each request
# while the rest of the config file is run only once.
#
# Otherwise, if it is false then gitweb processes the config file only once;
# if it is true then the gitweb config is run for each request.
652 our $per_request_config = 1;
653
654 # read and parse gitweb config file given by its parameter.
655 # returns true on success, false on recoverable error, allowing
656 # to chain this subroutine, using first file that exists.
657 # dies on errors during parsing config file, as it is unrecoverable.
sub read_config_file {
        my ($config_path) = @_;

        # nothing to do (and nothing returned) for a missing name or file
        return unless defined $config_path && -e $config_path;

        # run the config file; die if there are errors parsing it
        do $config_path;
        die $@ if $@;

        return 1;
}
669
670 our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
# Determine the names of the gitweb config files (environment variables take
# precedence over the built-in "++...++" values) and read them: first the
# common file, then the first existing one of the per-instance and the
# system-wide file.
sub evaluate_gitweb_config {
        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";

        # Protect against duplicated file names, so that no config file is
        # read twice.  Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is
        # ever used, so a duplicate between those two does not matter.
        for my $config_name (\$GITWEB_CONFIG, \$GITWEB_CONFIG_SYSTEM) {
                $$config_name = "" if ($$config_name eq $GITWEB_CONFIG_COMMON);
        }

        # Common system-wide settings for convenience.
        # Those settings can be overridden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
        read_config_file($GITWEB_CONFIG_COMMON);

        # Use the first config file that exists: the per-instance
        # GITWEB_CONFIG if present, otherwise GITWEB_CONFIG_SYSTEM.
        return if read_config_file($GITWEB_CONFIG);
        return read_config_file($GITWEB_CONFIG_SYSTEM);
}
691
692 # Get loadavg of system, to compare against $maxload.
693 # Currently it requires '/proc/loadavg' present to get loadavg;
694 # if it is not present it returns 0, which means no load checking.
sub get_loadavg {
        my $loadavg_file = '/proc/loadavg';

        # additional checks for load average should go here for things that
        # don't export /proc/loadavg; until then such systems report 0
        return 0 unless -e $loadavg_file;

        open my $fd, '<', $loadavg_file
                or return 0;
        # Only the first whitespace-separated column of the first line is
        # used; the remaining columns are ignored.
        my ($first_column) = split(/\s+/, scalar <$fd>);
        close $fd;

        return $first_column || 0;
}
713
714 # version of the core git binary
715 our $git_version;
# Run "$GIT --version" and store the reported version in $git_version
# ("unknown" when the output does not contain "git version ..."); the run is
# counted in $number_of_git_cmds.
sub evaluate_git_version {
        my $version_output = qx("$GIT" --version);

        our $git_version = "unknown";
        if ($version_output =~ m/git version (.*)$/) {
                $git_version = $1;
        }

        $number_of_git_cmds++;
}
720
# Report a 503 error through die_error() when load checking is enabled
# ($maxload defined) and get_loadavg() is above $maxload.
sub check_loadavg {
        die_error(503, "The load average on the server is too high")
                if defined $maxload && get_loadavg() > $maxload;
}
726
727 # ======================================================================
728 # input validation and dispatch
729
730 # input parameters can be collected from a variety of sources (presently, CGI
731 # and PATH_INFO), so we define an %input_params hash that collects them all
732 # together during validation: this allows subsequent uses (e.g. href()) to be
733 # agnostic of the parameter origin
734
our %input_params = ();

# Keys of %input_params are the long parameter names. The same long names
# are what href() receives, and href() has to turn them into their short CGI
# equivalents; as that is the most frequent use, the table below maps
# long name -> CGI key rather than the other way round.
#
# The list form keeps the order of the entries; the hash form is for lookups.
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.

our @cgi_param_mapping = (
        project           => 'p',
        action            => 'a',
        file_name         => 'f',
        file_parent       => 'fp',
        hash              => 'h',
        hash_parent       => 'hp',
        hash_base         => 'hb',
        hash_parent_base  => 'hpb',
        page              => 'pg',
        order             => 'o',
        searchtext        => 's',
        searchtype        => 'st',
        snapshot_format   => 'sf',
        extra_options     => 'opt',
        search_use_regexp => 'sr',
        ctag              => 'by_tag',
        # this must be last entry (for manipulation from JavaScript)
        javascript        => 'js',
);
our %cgi_param_mapping = @cgi_param_mapping;
766
# dispatch table of the known actions: action name => handler subroutine;
# it is also what action names are validated against
our %actions = (
        blame             => \&git_blame,
        blame_incremental => \&git_blame_incremental,
        blame_data        => \&git_blame_data,
        blobdiff          => \&git_blobdiff,
        blobdiff_plain    => \&git_blobdiff_plain,
        blob              => \&git_blob,
        blob_plain        => \&git_blob_plain,
        commitdiff        => \&git_commitdiff,
        commitdiff_plain  => \&git_commitdiff_plain,
        commit            => \&git_commit,
        forks             => \&git_forks,
        heads             => \&git_heads,
        history           => \&git_history,
        log               => \&git_log,
        patch             => \&git_patch,
        patches           => \&git_patches,
        remotes           => \&git_remotes,
        rss               => \&git_rss,
        atom              => \&git_atom,
        search            => \&git_search,
        search_help       => \&git_search_help,
        shortlog          => \&git_shortlog,
        summary           => \&git_summary,
        tag               => \&git_tag,
        tags              => \&git_tags,
        tree              => \&git_tree,
        snapshot          => \&git_snapshot,
        object            => \&git_object,
        # those below don't need $project
        opml              => \&git_opml,
        project_list      => \&git_project_list,
        project_index     => \&git_project_index,
);
802
# allowed extra_options: each option maps to the list of actions that
# accept it
our %allowed_options = (
        '--no-merges' => [ 'rss', 'atom', 'log', 'shortlog', 'history' ],
);
808
# Copy the CGI query parameters into %input_params, keyed by long name.
# Every parameter is stored as a single value, except 'opt' which may be
# given more than once and is therefore stored as an array reference. Should
# more multi-valued parameters appear, a list of them would be the better
# approach; for now 'opt' is simply special-cased.
sub evaluate_query_params {
        our $cgi;

        foreach my $name (keys %cgi_param_mapping) {
                my $symbol = $cgi_param_mapping{$name};
                $input_params{$name} = ($symbol eq 'opt')
                        ? [ $cgi->param($symbol) ]
                        : scalar $cgi->param($symbol);
        }
}
824
# now read PATH_INFO and update the parameter list for missing parameters
#
# Does nothing when the project was already given in the query string or
# when $path_info is empty. Otherwise the longest leading part of $path_info
# accepted by check_head_link() becomes the project, and the rest is parsed as
#   [action/][parent_ref[:parent_path]..]ref[:path]
# Values are stored with ||=, so parameters already present in %input_params
# take precedence over the ones found in PATH_INFO.
sub evaluate_path_info {
        return if defined $input_params{'project'};
        return if !$path_info;
        $path_info =~ s,^/+,,;
        return if !$path_info;

        # find which part of PATH_INFO is project
        my $project = $path_info;
        $project =~ s,/+$,,;
        while ($project && !check_head_link("$projectroot/$project")) {
                $project =~ s,/*[^/]*$,,;
        }
        return unless $project;
        $input_params{'project'} = $project;

        # do not change any parameters if an action is given using the query string
        return if $input_params{'action'};
        $path_info =~ s,^\Q$project\E/*,,;

        # next, check if we have an action
        my $action = $path_info;
        $action =~ s,/.*$,,;
        if (exists $actions{$action}) {
                # the action name is quoted so that it is matched literally
                $path_info =~ s,^\Q$action\E/*,,;
                $input_params{'action'} = $action;
        }

        # list of actions that want hash_base instead of hash, but can have no
        # pathname (f) parameter
        my @wants_base = (
                'tree',
                'history',
        );

        # we want to catch, among others
        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
        my ($parentrefname, $parentpathname, $refname, $pathname) =
                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

        # first, analyze the 'current' part
        if (defined $pathname) {
                # we got "branch:filename" or "branch:dir/"
                # we could use git_get_type(branch:pathname), but:
                # - it needs $git_dir
                # - it does a git() call
                # - the convention of terminating directories with a slash
                #   makes it superfluous
                # - embedding the action in the PATH_INFO would make it even
                #   more superfluous
                $pathname =~ s,^/+,,;
                if (!$pathname || substr($pathname, -1) eq "/") {
                        $input_params{'action'} ||= "tree";
                        $pathname =~ s,/$,,;
                } else {
                        # the default action depends on whether we had parent info
                        # or not
                        if ($parentrefname) {
                                $input_params{'action'} ||= "blobdiff_plain";
                        } else {
                                $input_params{'action'} ||= "blob_plain";
                        }
                }
                $input_params{'hash_base'} ||= $refname;
                $input_params{'file_name'} ||= $pathname;
        } elsif (defined $refname) {
                # we got "branch". In this case we have to choose if we have to
                # set hash or hash_base.
                #
                # Most of the actions without a pathname only want hash to be
                # set, except for the ones specified in @wants_base that want
                # hash_base instead. It should also be noted that hand-crafted
                # links having 'history' as an action and no pathname or hash
                # set will fail, but that happens regardless of PATH_INFO.
                if (defined $parentrefname) {
                        # if there is parent let the default be 'shortlog' action
                        # (for http://git.example.com/repo.git/A..B links); if there
                        # is no parent, dispatch will detect type of object and set
                        # action appropriately if required (if action is not set)
                        $input_params{'action'} ||= "shortlog";
                }
                if ($input_params{'action'} &&
                    grep { $_ eq $input_params{'action'} } @wants_base) {
                        $input_params{'hash_base'} ||= $refname;
                } else {
                        $input_params{'hash'} ||= $refname;
                }
        }

        # next, handle the 'parent' part, if present
        if (defined $parentrefname) {
                # a missing pathspec defaults to the 'current' filename, allowing e.g.
                # someproject/blobdiff/oldrev..newrev:/filename
                if ($parentpathname) {
                        $parentpathname =~ s,^/+,,;
                        $parentpathname =~ s,/$,,;
                        $input_params{'file_parent'} ||= $parentpathname;
                } else {
                        $input_params{'file_parent'} ||= $input_params{'file_name'};
                }
                # we assume that hash_parent_base is wanted if a path was specified,
                # or if the action wants hash_base instead of hash
                # (the action can still be unset here, e.g. for "A.." links, so
                # it is only compared when defined)
                if (defined $input_params{'file_parent'} ||
                    (defined $input_params{'action'} &&
                     grep { $_ eq $input_params{'action'} } @wants_base)) {
                        $input_params{'hash_parent_base'} ||= $parentrefname;
                } else {
                        $input_params{'hash_parent'} ||= $parentrefname;
                }
        }

        # for the snapshot action, we allow URLs in the form
        # $project/snapshot/$hash.ext
        # where .ext determines the snapshot and gets removed from the
        # passed $refname to provide the $hash.
        #
        # To be able to tell that $refname includes the format extension, we
        # require the following two conditions to be satisfied:
        # - the hash input parameter MUST have been set from the $refname part
        #   of the URL (i.e. they must be equal)
        # - the snapshot format MUST NOT have been defined already (e.g. from
        #   CGI parameter sf)
        # It's also useless to try any matching unless $refname has a dot,
        # so we check for that too
        if (defined $input_params{'action'} &&
                $input_params{'action'} eq 'snapshot' &&
                defined $refname && index($refname, '.') != -1 &&
                defined $input_params{'hash'} &&
                $refname eq $input_params{'hash'} &&
                !defined $input_params{'snapshot_format'}) {
                # We loop over the known snapshot formats, checking for
                # extensions. Allowed extensions are both the defined suffix
                # (which includes the initial dot already) and the snapshot
                # format key itself, with a prepended dot.
                #
                # The loop is left early, so it iterates over a list of keys and
                # not with each(): an each() iterator abandoned half-way is not
                # reset, and in a persistent process the next scan of the hash
                # would start in the middle. Sorting makes the result
                # independent of the hash order.
                foreach my $fmt (sort keys %known_snapshot_formats) {
                        my $opt = $known_snapshot_formats{$fmt};
                        my $hash = $refname;
                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
                                next;
                        }
                        my $sfx = $1;
                        # a valid suffix was found, so set the snapshot format
                        # and reset the hash parameter
                        $input_params{'snapshot_format'} = $fmt;
                        $input_params{'hash'} = $hash;
                        # we also set the format suffix to the one requested
                        # in the URL: this way a request for e.g. .tgz returns
                        # a .tgz instead of a .tar.gz
                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
                        last;
                }
        }
}
975
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp);
# Copy the collected %input_params into the global parameter variables,
# validating each of them on the way. An invalid value ends the request via
# die_error() (400 in general, 404 for an unknown project, 403 for a search
# text that is too short).
sub evaluate_and_validate_params {
        our $action = $input_params{'action'};
        if (defined $action) {
                if (!validate_action($action)) {
                        die_error(400, "Invalid action parameter");
                }
        }

        # parameters which are pathnames
        our $project = $input_params{'project'};
        if (defined $project) {
                if (!validate_project($project)) {
                        undef $project;
                        die_error(404, "No such project");
                }
        }

        our $file_name = $input_params{'file_name'};
        if (defined $file_name) {
                if (!validate_pathname($file_name)) {
                        die_error(400, "Invalid file parameter");
                }
        }

        our $file_parent = $input_params{'file_parent'};
        if (defined $file_parent) {
                if (!validate_pathname($file_parent)) {
                        die_error(400, "Invalid file parent parameter");
                }
        }

        # parameters which are refnames
        our $hash = $input_params{'hash'};
        if (defined $hash) {
                if (!validate_refname($hash)) {
                        die_error(400, "Invalid hash parameter");
                }
        }

        our $hash_parent = $input_params{'hash_parent'};
        if (defined $hash_parent) {
                if (!validate_refname($hash_parent)) {
                        die_error(400, "Invalid hash parent parameter");
                }
        }

        our $hash_base = $input_params{'hash_base'};
        if (defined $hash_base) {
                if (!validate_refname($hash_base)) {
                        die_error(400, "Invalid hash base parameter");
                }
        }

        our @extra_options = @{$input_params{'extra_options'}};
        # @extra_options is always defined, since it can only be (currently) set from
        # CGI, and $cgi->param() returns the empty array in array context if the param
        # is not set
        foreach my $opt (@extra_options) {
                if (not exists $allowed_options{$opt}) {
                        die_error(400, "Invalid option parameter");
                }
                # plain string comparison: the action may be unset at this
                # point, and it has no business being used as a regexp
                my $allowed_for_action = defined $action &&
                        grep { $_ eq $action } @{$allowed_options{$opt}};
                if (not $allowed_for_action) {
                        die_error(400, "Invalid option parameter for this action");
                }
        }

        our $hash_parent_base = $input_params{'hash_parent_base'};
        if (defined $hash_parent_base) {
                if (!validate_refname($hash_parent_base)) {
                        die_error(400, "Invalid hash parent base parameter");
                }
        }

        # other parameters
        our $page = $input_params{'page'};
        if (defined $page) {
                if ($page =~ m/[^0-9]/) {
                        die_error(400, "Invalid page parameter");
                }
        }

        our $searchtype = $input_params{'searchtype'};
        if (defined $searchtype) {
                if ($searchtype =~ m/[^a-z]/) {
                        die_error(400, "Invalid searchtype parameter");
                }
        }

        our $search_use_regexp = $input_params{'search_use_regexp'};

        our $searchtext = $input_params{'searchtext'};
        our $search_regexp;
        if (defined $searchtext) {
                if (length($searchtext) < 2) {
                        die_error(403, "At least two characters are required for search parameter");
                }
                if ($search_use_regexp) {
                        $search_regexp = $searchtext;
                        # the search text comes from the user: make sure it compiles
                        # now, so that a broken pattern is reported as a bad request
                        # instead of dying later, wherever the regexp is first used
                        if (!eval { qr/$search_regexp/; 1; }) {
                                die_error(400, "Invalid search regexp");
                        }
                } else {
                        $search_regexp = quotemeta $searchtext;
                }
        }
}
1078
# path to the current git repository; undefined when no project is selected
our $git_dir;
sub evaluate_git_dir {
        # Assign unconditionally: in a persistent process (e.g. FastCGI) a
        # request without a project must not keep the directory that was set
        # for the project of the previous request.
        our $git_dir = $project ? "$projectroot/$project" : undef;
}
1084
our (@snapshot_fmts, $git_avatar);
# Set up the feature dependent globals: @snapshot_fmts and $git_avatar.
sub configure_gitweb_features {
        our (@snapshot_fmts, $git_avatar);

        # list of supported snapshot formats
        @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # The avatar feature must name a known provider whose dependencies
        # are satisfied; in every other case $git_avatar is reset to the
        # empty string.
        ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'picon') {
                # known provider, no dependencies
        } elsif ($git_avatar eq 'gravatar') {
                # gravatar needs Digest::MD5
                my $have_md5 = eval { require Digest::MD5; 1; };
                $git_avatar = '' unless $have_md5;
        } else {
                # unknown provider
                $git_avatar = '';
        }
}
1104
# custom error handler: 'die <message>' is Internal Server Error
# (registered with CGI::Carp through set_message() right below)
sub handle_errors_html {
        my ($msg) = @_; # it is already HTML escaped

        # an error inside die_error itself would bring us back here, over and
        # over again; avoid that by replacing this handler with a plain
        # message before calling die_error
        set_message("Error occured when inside die_error:\n$msg");

        # you cannot jump out of die_error when called as error handler;
        # the subroutine set via CGI::Carp::set_message is called _after_
        # HTTP headers are already written, so it cannot write them itself
        my @handler_opts = (-error_handler => 1, -no_http_header => 1);
        die_error(undef, undef, $msg, @handler_opts);
}
set_message(\&handle_errors_html);
1119
# dispatch: run the handler of the requested action
#
# Without an explicit action one is derived from the other parameters: the
# type of the object named by hash, or by hash_base:file_name, then 'summary'
# if there is a project, and 'project_list' as the last resort.
sub dispatch {
        unless (defined $action) {
                $action =
                          defined $hash
                                ? git_get_type($hash)
                        : (defined $hash_base && defined $file_name)
                                ? git_get_type("$hash_base:$file_name")
                        : defined $project
                                ? 'summary'
                                : 'project_list';
        }

        die_error(400, "Unknown action")
                unless defined($actions{$action});

        # all actions but these three work on a project
        my $needs_project = $action !~ m/^(?:opml|project_list|project_index)$/;
        die_error(400, "Project needed")
                if $needs_project && !$project;

        $actions{$action}->();
}
1142
# Start the per-request bookkeeping afresh: the timestamp in $t0 is renewed
# (only if it is defined), and the counter of git commands goes back to 0.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [ gettimeofday() ];
        }
        $number_of_git_cmds = 0;
}
1148
our $first_request = 1;
# Serve a single request: (re)read the configuration as needed, check the
# load, collect and validate the input parameters, then dispatch.
sub run_request {
        reset_timer();

        evaluate_uri();
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }
        # $per_request_config as a code reference is called on every request;
        # any other true value means re-reading the config on every request
        # but the first one (where it has just been read above)
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }
        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list = $projectroot
                unless $projects_list;

        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1179
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;
# Switch to FastCGI operation: requests are created through CGI::Fast, and
# $is_last_request is replaced by a counter, so that the request loop is left
# after a fixed number of requests instead of after the first one.
sub configure_as_fcgi {
        require CGI::Fast;
        our $CGI = 'CGI::Fast';

        my $request_number = 0;
        # let each child service 100 requests; the check runs after a request
        # has been served, so the 100th one has to be reported as the last
        our $is_last_request = sub { ++$request_number >= 100 };
}
# Choose the mode of operation from the name of the script and from the
# command line:
#   - a script name ending in '.fcgi', or the option --fastcgi (--fcgi, -f),
#     turns on FastCGI mode
#   - --nproc=N (-n N) runs N processes under FCGI::ProcManager, by
#     installing the pre-listen and pre-/post-dispatch hooks; the option
#     is ignored if that module cannot be loaded
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        return unless (@ARGV);

        my $use_proc_manager = sub {
                my ($opt_name, $n_processes) = @_;
                return unless eval { require FCGI::ProcManager; 1; };

                my $proc_manager = FCGI::ProcManager->new({
                        n_processes => $n_processes,
                });
                our ($pre_listen_hook, $pre_dispatch_hook, $post_dispatch_hook);
                $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
                $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
                $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1214
# Main loop: create request objects of class $CGI one after another and
# serve them, until no more request can be created or $is_last_request
# says so. The hooks, when set, are called before the loop is entered and
# around each request.
sub run {
        evaluate_argv();

        $first_request = 1;
        if ($pre_listen_hook) {
                $pre_listen_hook->();
        }

 REQUEST:
        while ($cgi = $CGI->new()) {
                if ($pre_dispatch_hook) {
                        $pre_dispatch_hook->();
                }

                run_request();

                if ($post_dispatch_hook) {
                        $post_dispatch_hook->();
                }
                $first_request = 0;

                if ($is_last_request->()) {
                        last REQUEST;
                }
        }

        # NOTE(review): nothing in this part of the file jumps to this label;
        # presumably it is a 'goto' target for code defined elsewhere - confirm
        # before removing or renaming it
 DONE_GITWEB:
        1;
}
1239
run();

# The code below this point consists of definitions only, so execution of
# the file has to stop here.
if (!defined caller) {
        # pure CGI script, serving single request
        exit;
} else {
        # wrapped in a subroutine processing requests,
        # e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
        return;
}
1250
1251 ## ======================================================================
1252 ## action links
1253
# Build the URL of a gitweb view from named parameters; the parameter names
# are the long names used as keys of %cgi_param_mapping, e.g.
#   href(action=>"log", hash=>$hash)
# 'project' defaults to the current $project. Depending on the 'pathinfo'
# feature (or on -path_info) as many parameters as possible are put in the
# path part of the URL, the rest ends up in the query string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # take over the parameters of the current request, unless
                # they were given explicitly
                foreach my $name (keys %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot
                # (the action is optional, so check that it is there at all)
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        # look the suffix up only for a format that exists: a
                        # lookup with an unknown (or undefined) key would add
                        # an empty entry to %known_snapshot_formats
                        if (defined $fmt && exists $known_snapshot_formats{$fmt} &&
                            defined $known_snapshot_formats{$fmt}{'suffix'}) {
                                $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        }
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly
        # (in the order of @cgi_param_mapping)
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1383
1384
1385 ## ======================================================================
1386 ## validation, quoting/unquoting and escaping
1387
# Return the given action name if it is one of the keys of %actions,
# undef otherwise (also for an empty or missing name).
sub validate_action {
        my ($input) = @_;

        return undef unless $input;
        return exists $actions{$input} ? $input : undef;
}
1393
# Return the given project name if it is usable, undef otherwise. A usable
# project is a valid pathname naming a directory below $projectroot which
# passes check_export_ok() and which, with $strict_export turned on, is
# also in the list of projects.
sub validate_project {
        my ($input) = @_;

        return undef unless $input;
        return undef unless validate_pathname($input);
        return undef unless -d "$projectroot/$input";
        return undef unless check_export_ok("$projectroot/$input");
        return undef if $strict_export && !project_in_list($input);

        return $input;
}
1405
# Return the given pathname if it is acceptable, undef otherwise.
sub validate_pathname {
        my ($input) = @_;

        return undef unless $input;

        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
        # at the beginning, at the end, and between slashes.
        # also this catches doubled slashes
        return undef if $input =~ m!(^|/)(|\.|\.\.)(/|$)!;

        # no null characters
        return undef if $input =~ m!\0!;

        return $input;
}
1421
# Return the given name if it is acceptable as a ref name or object id,
# undef otherwise.
sub validate_refname {
        my $input = shift || return undef;

        # textual hashes are O.K.
        # (anchored with \A and \z: '$' would also accept a hash followed
        # by a newline)
        if ($input =~ m/\A[0-9a-fA-F]{40}\z/) {
                return $input;
        }
        # it must be correct pathname
        $input = validate_pathname($input)
                or return undef;
        # restrictions on ref name according to git-check-ref-format
        if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
                return undef;
        }
        return $input;
}
1438
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# A string which is already in the internal form is returned unchanged;
# octets which are not valid utf8 are decoded using $fallback_encoding.
# Returns undef for undefined input.
sub to_utf8 {
        my $str = shift;
        return undef unless defined $str;

        # utf8::valid() cannot be used to tell whether the octets are utf8:
        # it only checks the internal consistency of the string, and is
        # true for any byte string. utf8::decode() does the job instead: it
        # decodes in place and returns false if the octets are not valid utf8.
        if (utf8::is_utf8($str) || utf8::decode($str)) {
                return $str;
        } else {
                return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
        }
}
1452
# URI-escape the value of a query parameter: unsafe characters are
# percent-encoded, a space becomes '+'. The slash is kept as it is - not
# strictly correct, but quoted slashes look too horrible in bookmarks.
sub esc_param {
        my ($str) = @_;
        return undef unless defined $str;

        $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $str =~ tr/ /+/;
        return $str;
}
1462
# URI-escape a fragment of PATH_INFO; the rules are slightly different from
# those for query parameters
sub esc_path_info {
        my ($str) = @_;
        return undef unless defined $str;

        # path_info doesn't treat '+' as space (specially), but '?' must be escaped
        $str =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

        return $str;
}
1473
# Escape unsafe characters in a complete URL.  Characters that carry
# meaning in a URL (such as '/', '?', '&', '=') cannot be quoted here.
# Spaces become '+'.  Returns undef for undefined input.
sub esc_url {
	my ($url) = @_;
	return undef unless defined $url;

	for ($url) {
		s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
		s/ /\+/g;
	}
	return $url;
}
1482
# Escape a string for use as an HTML attribute value.
# Takes the same arguments as esc_html() and returns what it returns.
sub esc_attr {
	my @args = @_;

	# for XHTML conformance escaping '"' to '&quot;' is not enough,
	# so the complete HTML escaping is applied
	return esc_html(@args);
}
1489
# Escape a string for inclusion in HTML.
# The string is decoded with to_utf8(), HTML-escaped, and every control
# character except TAB is replaced by its quot_cec() representation.
# With the option -nbsp => 1 spaces are turned into '&nbsp;'.
# Returns undef for undefined input.
sub esc_html {
	my ($str, %opts) = @_;

	return undef unless defined $str;

	my $html = $cgi->escapeHTML(to_utf8($str));
	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	# tabs are left alone, all other control characters are made visible
	$html =~ s|([[:cntrl:]])|(($1 eq "\t") ? $1 : quot_cec($1))|eg;
	return $html;
}
1505
# Escape a filename for inclusion in HTML.
# Works like esc_html(), except that every control character, TAB
# included, is replaced by its quot_cec() representation.
# With the option -nbsp => 1 spaces are turned into '&nbsp;'.
# Returns undef for undefined input.
sub esc_path {
	my ($path, %opts) = @_;

	return undef unless defined $path;

	my $html = $cgi->escapeHTML(to_utf8($path));
	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$html =~ s|([[:cntrl:]])|quot_cec($1)|eg;
	return $html;
}
1521
# Sanitize for use in XHTML + application/xhtml+xml (valid XML 1.0):
# the string is decoded with to_utf8() and every control character other
# than TAB, LF and CR is replaced by its quot_cec() representation.
# No HTML escaping is done here.  Returns undef for undefined input.
sub sanitize {
	my ($text) = @_;

	return undef unless defined $text;

	$text = to_utf8($text);
	$text =~ s|([[:cntrl:]])|($1 !~ /[\t\n\r]/ ? quot_cec($1) : $1)|eg;
	return $text;
}
1532
# Make control characters "printable", using character escape codes (CEC)
#
# $cntrl is a single character.  Characters with a well known escape
# sequence are shown as that sequence (e.g. '\n'); every other one is
# shown as a backslash followed by its code as two hexadecimal digits,
# zero padded (e.g. '\01'), so that the output never contains a blank.
# Unless the option -nohtml is true the result is wrapped in
# <span class="cntrl">...</span>.
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	my $chr = ( (exists $es{$cntrl})
		    ? $es{$cntrl}
		    : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1557
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR)
#
# $cntrl is a single control character; the result is a decimal numeric
# character reference to its symbol in the Control Pictures block.
# Unless the option -nohtml is true the result is wrapped in
# <span class="cntrl">...</span>.
sub quot_upr {
	my $cntrl = shift;
	my %opts = @_;

	my $code = ord($cntrl);
	# C0 controls map to U+2400 + code, but the picture for DEL (0x7f)
	# lives at U+2421; U+2400 + 0x7f is outside the Control Pictures block
	my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

	my $chr = sprintf('&#%04d;', $picture);
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1571
# git may return quoted and escaped filenames
#
# A name enclosed in double quotes has the quotes removed and its
# backslash escapes expanded; any other string is returned unchanged.
sub unquote {
	my $name = shift;

	# only names wrapped in double quotes need unquoting
	return $name unless $name =~ m/^"(.*)"$/;

	$name = $1;
	$name =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	return $name;
}

# helper for unquote(): expand the text that followed a backslash,
# which is either up to three octal digits or one other character
sub unq {
	my $seq = shift;
	my %es = ( # character escape codes, aka escape sequences
		't' => "\t",   # tab            (HT, TAB)
		'n' => "\n",   # newline        (NL)
		'r' => "\r",   # return         (CR)
		'f' => "\f",   # form feed      (FF)
		'b' => "\b",   # backspace      (BS)
		'a' => "\a",   # alarm (bell)   (BEL)
		'e' => "\e",   # escape         (ESC)
		'v' => "\013", # vertical tab   (VT)
	);

	# octal char sequence
	return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

	# C escape sequence, aka character escape code
	return $es{$seq} if exists $es{$seq};

	# quoted ordinary character
	return $seq;
}
1607
# escape tabs (convert tabs to spaces)
#
# Every tab is replaced by as many spaces as are needed to reach the
# next column that is a multiple of 8.
sub untabify {
	my $line = shift;
	my $tab_width = 8;

	for (my $pos = index($line, "\t");
	     $pos != -1;
	     $pos = index($line, "\t", $pos)) {
		# between 1 and 8 spaces, depending on the current column
		my $padding = ' ' x ($tab_width - $pos % $tab_width);
		substr($line, $pos, 1) = $padding;
	}

	return $line;
}
1621
# Tell whether $project is the 'path' of one of the entries returned by
# git_get_projects_list(): returns the number of matching entries,
# or 0 when the list is empty.
sub project_in_list {
	my ($project) = @_;
	my @projects = git_get_projects_list();

	return 0 unless @projects;

	my $matches = grep { $_->{'path'} eq $project } @projects;
	return $matches;
}
1627
1628 ## ----------------------------------------------------------------------
1629 ## HTML aware string manipulation
1630
# Shorten a string to about $len characters, preferring to cut on a word
# boundary found within the next $add_len characters (default 10); if
# there is no word boundary there, cut at $len+$add_len.  $where selects
# the part that is dropped: 'left', 'center' or 'right' (default).
# The dropped part is replaced by an ellipsis, but only if it is longer
# than the ellipsis itself; a string that would not get shorter is
# returned whole.  The result is in Perl's internal (decoded) form.
sub chop_str {
	my ($str, $len, $add_len, $where) = @_;
	$add_len ||= 10;
	$where   ||= 'right'; # 'left' | 'center' | 'right'

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# return early if chopping wouldn't make string shorter;
	# the filler is 5 characters when chopping in the middle, 4 otherwise
	my $centered   = ($where eq 'center');
	my $filler_len = $centered ? 5 : 4;
	return $str if ($len + $filler_len >= length($str));

	# when chopping in the middle, distribute $len into left and right part
	$len = int($len/2) if $centered;

	# regexps: ending and beginning with word part up to $add_len
	my $endre = qr/.{$len}\w{0,$add_len}/;
	my $begre = qr/\w{0,$add_len}.{$len}/;

	if ($where eq 'left') {
		$str =~ m/^(.*?)($begre)$/;
		my ($dropped, $kept) = ($1, $2);
		$dropped = " ..." if (length($dropped) > 4);
		return "$dropped$kept";
	}

	if ($centered) {
		$str =~ m/^($endre)(.*)$/;
		my ($head, $rest) = ($1, $2);
		$rest =~ m/^(.*?)($begre)$/;
		my ($dropped, $foot) = ($1, $2);
		$dropped = " ... " if (length($dropped) > 5);
		return "$head$dropped$foot";
	}

	# chop on the right
	$str =~ m/^($endre)(.*)$/;
	my ($kept, $dropped) = ($1, $2);
	$dropped = "... " if (length($dropped) > 4);
	return "$kept$dropped";
}
1690
# takes the same arguments as chop_str, but also wraps a <span> around the
# result with a title attribute if it does get chopped. Additionally, the
# string is HTML-escaped.
sub chop_and_escape_str {
	my ($str) = @_;

	my $chopped = chop_str(@_);
	# chop_str() returns a decoded string, so decode the original too:
	# otherwise an unchopped string with non-ASCII characters compares
	# as different, and the title would be built from undecoded octets
	$str = to_utf8($str);
	if ($chopped eq $str) {
		return esc_html($chopped);
	} else {
		# control characters are not wanted in the tooltip
		$str =~ s/[[:cntrl:]]/?/g;
		return $cgi->span({-title=>$str}, esc_html($chopped));
	}
}
1705
1706 ## ----------------------------------------------------------------------
1707 ## functions returning short strings
1708
# CSS class for given age value (in seconds):
# "noage" when undefined, "age0" below two hours,
# "age1" below two days, "age2" otherwise
sub age_class {
	my ($age) = @_;

	return "noage" unless defined $age;
	return "age0"  if $age < 60*60*2;
	return "age1"  if $age < 60*60*24*2;
	return "age2";
}
1723
# convert age in seconds to "nn units ago" string
#
# The largest unit of which the age holds more than two is used;
# an age of two seconds or less gives " right now".
sub age_string {
	my $age = shift;

	# [ exclusive lower bound, divisors applied one after another, suffix ]
	my @scales = (
		[ 60*60*24*365*2,      [ 60, 60, 24, 365 ],      " years ago"  ],
		[ 60*60*24*(365/12)*2, [ 60, 60, 24, (365/12) ], " months ago" ],
		[ 60*60*24*7*2,        [ 60, 60, 24, 7 ],        " weeks ago"  ],
		[ 60*60*24*2,          [ 60, 60, 24 ],           " days ago"   ],
		[ 60*60*2,             [ 60, 60 ],               " hours ago"  ],
		[ 60*2,                [ 60 ],                   " min ago"    ],
		[ 2,                   [ ],                      " sec ago"    ],
	);

	foreach my $scale (@scales) {
		my ($bound, $divisors, $suffix) = @$scale;
		next unless $age > $bound;

		my $count = $age;
		$count = $count / $_ foreach @$divisors;
		return int($count) . $suffix;
	}

	return " right now";
}
1755
# file type bit patterns, in addition to the ones Fcntl provides
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# submodule/subproject, a commit object reference:
# true if the file type bits of $mode are those of a gitlink
sub S_ISGITLINK {
	my ($mode) = @_;

	my $type_bits = ($mode & S_IFMT);
	return ($type_bits == S_IFGITLINK);
}
1767
# convert file mode in octal to symbolic file mode string
# (in the style of the first column of "ls -l")
sub mode_str {
	my $mode = oct shift;

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
	return 'lrwxrwxrwx' if S_ISLNK($mode);
	return '----------' unless S_ISREG($mode);

	# regular file: git cares only about the executable bit
	return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1789
# convert file mode in octal to file type string
# (anything that is not a string of octal digits is returned unchanged)
sub file_type {
	my $mode = shift;

	return $mode unless $mode =~ m/^[0-7]+$/;
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT);
	return "symlink"   if S_ISLNK($mode);
	return "file"      if S_ISREG($mode);
	return "unknown";
}
1812
# convert file mode in octal to file type description string
# (anything that is not a string of octal digits is returned unchanged);
# unlike file_type() this tells executable files from other regular files
sub file_type_long {
	my $mode = shift;

	return $mode unless $mode =~ m/^[0-7]+$/;
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT);
	return "symlink"   if S_ISLNK($mode);
	return "unknown"   unless S_ISREG($mode);

	return ($mode & S_IXUSR) ? "executable" : "file";
}
1839
1840
1841 ## ----------------------------------------------------------------------
1842 ## functions returning short HTML fragments, or transforming HTML fragments
1843 ## which don't belong to other sections
1844
# format line of commit message: the line is HTML-escaped (spaces become
# '&nbsp;') and everything that looks like an object id of 8 to 40
# hexadecimal digits is turned into a link to the "object" view
sub format_log_line_html {
	my ($line) = @_;

	my $html = esc_html($line, -nbsp=>1);
	$html =~ s{\b([0-9a-fA-F]{8,40})\b}{
		my $id = $1;
		$cgi->a({-href => href(action=>"object", hash=>$id),
		         -class => "text"}, $id);
	}eg;

	return $html;
}
1857
# format marker of refs pointing to given object
#
# $refs maps object ids to array references of ref names (e.g.
# "tags/v2.6.11", "heads/next"; a trailing "^{}" marks an indirect
# entry), $id is the object to format the markers for.  Returns an HTML
# fragment, or the empty string if no ref points to $id.

# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
	my ($refs, $id) = @_;
	my $markers = '';

	if (defined $refs->{$id}) {
		foreach my $ref (@{$refs->{$id}}) {
			# this code exploits the fact that non-lightweight tags are the
			# only indirect objects, and that they are the only objects for which
			# we want to use tag instead of shortlog as action
			my ($type, $name) = qw();
			# NOTE: $ref aliases the element of the caller's array, so the
			# "^{}" suffix is removed from the caller's data as well
			my $indirect = ($ref =~ s/\^\{\}$//);
			# e.g. tags/v2.6.11 or heads/next
			if ($ref =~ m!^(.*?)s?/(.*)$!) {
				$type = $1;
				$name = $2;
			} else {
				$type = "ref";
				$name = $ref;
			}

			my $class = $type;
			$class .= " indirect" if $indirect;

			my $dest_action = "shortlog";

			if ($indirect) {
				$dest_action = "tag" unless $action eq "tag";
			} elsif ($action =~ /^(history|(short)?log)$/) {
				$dest_action = $action;
			}

			my $dest = "";
			$dest .= "refs/" unless $ref =~ m!^refs/!;
			$dest .= $ref;

			# ref names may contain '<', '>' and '&', so the link text
			# has to be escaped just like the attributes below
			my $link = $cgi->a({
				-href => href(
					action=>$dest_action,
					hash=>$dest
				)}, esc_html($name));

			$markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
				$link . "</span>";
		}
	}

	if ($markers) {
		return ' <span class="refs">'. $markers . '</span>';
	} else {
		return "";
	}
}
1917
# format, perhaps shortened and with markers, title line
#
# Returns a link to $href showing the subject, followed by $extra (if
# given).  When $short is shorter than $long the short form is shown and
# the long one (control characters replaced by '?') becomes the title.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my %attr  = (-href => $href, -class => "list subject");
	my $shown = $long;

	if (length($short) < length($long)) {
		$shown = $short;
		$long =~ s/[[:cntrl:]]/?/g;
		$attr{-title} = to_utf8($long);
	}

	return $cgi->a(\%attr, esc_html($shown)) . $extra;
}
1933
1934 # Rather than recomputing the url for an email multiple times, we cache it
1935 # after the first hit. This gives a visible benefit in views where the avatar
1936 # for the same email is used repeatedly (e.g. shortlog).
1937 # The cache is shared by all avatar engines (currently gravatar and picon), which
1938 # are free to use it as preferred. Since only one avatar engine is used for any
1939 # given page, there's no risk for cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first; the url is computed once per email and
# then served from %avatar_cache.
sub picon_url {
	my $email = lc shift;

	return $avatar_cache{$email} if $avatar_cache{$email};

	my ($user, $domain) = split('@', $email);
	my $url = "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
	          "$domain/$user/" .
	          "users+domains+unknown/up/single";
	$avatar_cache{$email} = $url;

	return $avatar_cache{$email};
}
1955
# Compute the gravatar url for a given email and size.
# Only the part of the url before the size is kept in %avatar_cache, since
# that is the computationally more expensive one (an MD5 digest of the
# lowercased email); this also lets entries be reused for different sizes.
sub gravatar_url {
	my $email = lc shift;
	my $size = shift;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"http://www.gravatar.com/avatar/" .
				Digest::MD5::md5_hex($email) . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
1968
# Return the <img> element showing the avatar for the given $email, or
# the empty string if no avatar provider is selected in $git_avatar.
# Options:
#   -size       => key into %avatar_size (falls back to 'default')
#   -pad_before => if true, put '&nbsp;' in front of the image
#   -pad_after  => if true, put '&nbsp;' after the image
sub git_get_avatar {
	my ($email, %opts) = @_;

	my $size_name = $opts{-size} || 'default';
	my $size = $avatar_size{$size_name} || $avatar_size{'default'};

	# Other providers can be added by extending the if chain, defining $url
	# as needed. If no variant puts something in $url, we assume avatars
	# are completely disabled/unavailable.
	my $url = "";
	if ($git_avatar eq 'gravatar') {
		$url = gravatar_url($email, $size);
	} elsif ($git_avatar eq 'picon') {
		$url = picon_url($email);
	}
	return "" unless $url;

	my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
	my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";

	return $pre_white .
	       qq!<img width="$size" class="avatar" src="! . esc_url($url) .
	       qq!" alt="" />! .
	       $post_white;
}
1997
# Wrap $displaytext (already formatted HTML) in a link that searches for
# commits by $author; $searchtype is 'author' or 'committer'.
# If the 'search' feature is disabled $displaytext is returned unchanged.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;
	my $have_search = gitweb_check_feature('search');

	return $displaytext unless $have_search;

	# verb used in the title of the link
	my %verb_for = (
		'author'    => "authored",
		'committer' => "committed",
	);
	my $performed = exists $verb_for{$searchtype} ? $verb_for{$searchtype} : "";

	my $search_url = href(action=>"search", hash=>$hash,
	                      searchtext=>$author,
	                      searchtype=>$searchtype);

	return $cgi->a({-href => $search_url, class=>"list",
	                title=>"Search for commits $performed by $author"},
	               $displaytext);
}
2020
# format the author name of the given commit with the given tag
# the author name is chopped and escaped according to the other
# optional parameters (see chop_str); it is preceded by the author's
# avatar and wrapped in a link searching for commits by that author
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $name_html = chop_and_escape_str($co->{'author_name'}, @chop_args);
	my $avatar    = git_get_avatar($co->{'author_email'}, -pad_after => 1);
	my $link      = format_search_author($co->{'author_name'}, "author",
	                                     $avatar . $name_html);

	return "<$tag class=\"author\">" . $link . "</$tag>";
}
2034
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
#
# The file names are cut off the line and put back escaped, as links
# where $from / $to provide an 'href'.  A true $diffinfo->{'nparents'}
# marks a combined diff, which shows the resulting file only.
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# escaped path with optional "a/" or "b/" prefix, hyperlinked if possible
	my $path_html = sub {
		my ($side, $prefix) = @_;
		my $text = esc_path($side->{'file'});
		$text = $prefix . $text if defined $prefix;
		return $text unless $side->{'href'}; # file was added/deleted (no href)
		return $cgi->a({-href => $side->{'href'}, -class => "path"}, $text);
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $path_html->($to);
	} else {
		# "ordinary" diff
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $path_html->($from, 'a/');
		$line .= ' ';
		$line .= $path_html->($to, 'b/');
	}

	return "<div class=\"diff header\">$line</div>\n";
}
2070
# format extended diff header line, before patch itself
#
# $line is one line of the extended header ("rename from ...",
# "new file mode ...", "index ...", etc.).  File names and object ids in
# it are replaced by links where $from / $to provide an 'href'; a single
# file mode at the end of the line gets a description of the file type
# appended.  Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
	my $line = shift;
	my $diffinfo = shift;
	my ($from, $to) = @_;

	# match <path>
	# (the path is cut off the line first, so it has to be put back,
	# escaped, even when there is nothing to link to)
	if ($line =~ s!^((copy|rename) from ).*$!$1!) {
		if ($from->{'href'}) {
			$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
			                 esc_path($from->{'file'}));
		} elsif (defined $from->{'file'}) {
			$line .= esc_path($from->{'file'});
		}
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1!) {
		if ($to->{'href'}) {
			$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
			                 esc_path($to->{'file'}));
		} elsif (defined $to->{'file'}) {
			$line .= esc_path($to->{'file'});
		}
	}
	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
		         file_type_long($1) .
		         ')</span>';
	}
	# match <hash>
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff
		$line = 'index ';
		for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
			if ($from->{'href'}[$i]) {
				$line .= $cgi->a({-href=>$from->{'href'}[$i],
				                  -class=>"hash"},
				                 substr($diffinfo->{'from_id'}[$i],0,7));
			} else {
				$line .= '0' x 7;
			}
			# separator
			$line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
		}
		$line .= '..';
		if ($to->{'href'}) {
			$line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                 substr($diffinfo->{'to_id'},0,7));
		} else {
			$line .= '0' x 7;
		}

	} elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff
		# (the two dots are literal, hence escaped in the pattern)
		my ($from_link, $to_link);
		if ($from->{'href'}) {
			$from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
			                     substr($diffinfo->{'from_id'},0,7));
		} else {
			$from_link = '0' x 7;
		}
		if ($to->{'href'}) {
			$to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                   substr($diffinfo->{'to_id'},0,7));
		} else {
			$to_link = '0' x 7;
		}
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
		$line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2136
# format from-file/to-file diff header
#
# Returns the HTML for the "--- ..." line(s) followed by the "+++ ..."
# line.  For an ordinary diff there is one from-file line; for a combined
# diff (true $diffinfo->{'nparents'}) there is one per parent, each with
# a numbered link to the diff against that parent (@parents holds the
# parents' ids).
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my $html = '';

	# escaped file name, hyperlinked when a target is known
	my $path_html = sub {
		my ($href, $file) = @_;
		return esc_path($file) unless $href;
		return $cgi->a({-href=>$href, -class=>"path"}, esc_path($file));
	};

	#assert($from_line =~ m/^---/) if DEBUG;
	if ($diffinfo->{'nparents'}) {
		# combined diff (merge commit)
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $row = '--- /dev/null';
			if ($from->{'href'}[$i]) {
				my $diff_link =
					$cgi->a({-href=>href(action=>"blobdiff",
					                     hash_parent=>$diffinfo->{'from_id'}[$i],
					                     hash_parent_base=>$parents[$i],
					                     file_parent=>$from->{'file'}[$i],
					                     hash=>$diffinfo->{'to_id'},
					                     hash_base=>$hash,
					                     file_name=>$to->{'file'}),
					         -class=>"path",
					         -title=>"diff" . ($i+1)},
					        $i+1);
				my $file_link =
					$cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
					        esc_path($from->{'file'}[$i]));
				$row = '--- ' . $diff_link . '/' . $file_link;
			}
			$html .= qq!<div class="diff from_file">$row</div>\n!;
		}

	} else {
		# ordinary (single parent) diff
		my $row = $from_line;
		# no extra formatting for "^--- /dev/null"
		if ($row =~ m!^--- "?a/!) {
			$row = '--- a/' . $path_html->($from->{'href'}, $from->{'file'});
		}
		$html .= qq!<div class="diff from_file">$row</div>\n!;
	}

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	my $row = $to_line;
	# no extra formatting for "^+++ /dev/null"
	if ($row =~ m!^\+\+\+ "?b/!) {
		$row = '+++ b/' . $path_html->($to->{'href'}, $to->{'file'});
	}
	$html .= qq!<div class="diff to_file">$row</div>\n!;

	return $html;
}
2202
# create note for patch simplified by combined diff:
# a "diff --cc <file>" header (the file name links to the blob unless the
# file is deleted) followed by a "Simple merge" note
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $path_html;
	if (is_deleted($diffinfo)) {
		$path_html = esc_path($diffinfo->{'to_file'});
	} else {
		$path_html = $cgi->a({-href => href(action=>"blob",
		                                    hash_base=>$hash,
		                                    hash=>$diffinfo->{'to_id'},
		                                    file_name=>$diffinfo->{'to_file'}),
		                      -class => "path"},
		                     esc_path($diffinfo->{'to_file'}));
	}

	my $header = "<div class=\"diff header\">" . "diff --cc ";
	$header .= $path_html;
	$header .= "</div>\n"; # class="diff header"

	my $note = "<div class=\"diff nodifferences\">" .
	           "Simple merge" .
	           "</div>\n"; # class="diff nodifferences"

	return $header . $note;
}
2227
# Format one line of patch text (not to be used for diff headers) as an
# HTML <div>.
#
# $line is the raw patch line.  $from and $to are optional hashes whose
# 'href' entry supplies the link target for the line numbers shown in chunk
# headers.  When $from->{'href'} is an array reference the line is treated
# as part of a combined diff, with one href per parent.
sub format_diff_line {
	my ($line, $from, $to) = @_;
	my $linkable = $from && $to;
	my $diff_class = "";

	chomp $line;

	if ($linkable && ref($from->{'href'}) eq "ARRAY") {
		# combined diff: the leading characters are one marker per parent
		my $prefix = substr($line, 0, scalar @{$from->{'href'}});
		$diff_class =
			$line =~ m/^\@{3}/   ? " chunk_header" :
			$line =~ m/^\\/      ? " incomplete"   :
			($prefix =~ tr/+/+/) ? " add"          :
			($prefix =~ tr/-/-/) ? " rem"          :
			                       "";
	} else {
		# assume ordinary diff: the first character decides
		my %class_of = (
			'+'  => " add",
			'-'  => " rem",
			'@'  => " chunk_header",
			"\\" => " incomplete",
		);
		my $char = substr($line, 0, 1);
		$diff_class = $class_of{$char} if exists $class_of{$char};
	}

	$line = untabify($line);

	my $html;
	if ($linkable && $line =~ m/^\@{2} /) {
		# ordinary chunk header; the line counts are matched but not shown
		my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
			$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

		if ($from->{'href'}) {
			$from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
			                     -class=>"list"}, $from_text);
		}
		if ($to->{'href'}) {
			$to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
			                     -class=>"list"}, $to_text);
		}
		$html = "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
		        "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";

	} elsif ($linkable && $line =~ m/^\@{3}/) {
		# combined chunk header: several ranges, the last one is the result
		my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

		# each range is a one-character sign followed by "start[,count]";
		# only the start is needed, for the link anchor
		my @range_text  = split(' ', $ranges);
		my @range_start =
			map { ((split(',', substr($_, 1)), 0))[0] } @range_text;
		my $to_text  = pop @range_text;
		my $to_start = pop @range_start;

		$html = "<span class=\"chunk_info\">$prefix ";
		foreach my $i (0 .. $#range_text) {
			if ($from->{'href'}[$i]) {
				$html .= $cgi->a({-href=>"$from->{'href'}[$i]#l$range_start[$i]",
				                  -class=>"list"}, $range_text[$i]);
			} else {
				$html .= $range_text[$i];
			}
			$html .= " ";
		}
		if ($to->{'href'}) {
			$html .= $cgi->a({-href=>"$to->{'href'}#l$to_start",
			                  -class=>"list"}, $to_text);
		} else {
			$html .= $to_text;
		}
		$html .= " $prefix</span>" .
		         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";

	} else {
		# any other line is shown escaped, as is
		$html = esc_html($line, -nbsp=>1);
	}

	return "<div class=\"diff$diff_class\">$html</div>\n";
}
2316
# Generates the snapshot link(s) for the tree/commit whose hash is passed.
# With several entries in @snapshot_fmts the result looks like
# "snapshot (_tar.gz_ _zip_)", one link per format; with exactly one entry
# it is a single "_snapshot_" link whose tooltip names the format; with
# none it is undef.
sub format_snapshot_links {
	my ($hash) = @_;
	my $num_fmts = @snapshot_fmts;

	# no formats at all: nothing to link to
	return undef if ($num_fmts == 0);

	if ($num_fmts == 1) {
		# A single "snapshot" link whose tooltip bears the format name.
		my ($fmt) = @snapshot_fmts;
		return $cgi->a({
			-href => href(action=>"snapshot",
			              hash=>$hash,
			              snapshot_format=>$fmt),
			-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
		}, "snapshot");
	}

	# A parenthesized list of links bearing format names.
	my @links = map {
		$cgi->a({
			-href => href(action=>"snapshot",
			              hash=>$hash,
			              snapshot_format=>$_)
		}, $known_snapshot_formats{$_}{'display'})
	} @snapshot_fmts;
	return "snapshot (" . join(' ', @links) . ")";
}
2351
2352 ## ......................................................................
2353 ## functions returning values to be passed, perhaps after some
2354 ## transformation, to other functions; e.g. returning arguments to href()
2355
# Returns a hash to be passed to href() to generate the feed URL for the
# current view; its -title key holds a description of the link.
# The optional argument is the feed format name (default 'Atom'); its
# lowercased form becomes the action.  Returns nothing when no project is
# selected or when the current action has no feed of its own.
sub get_feed_info {
	my $format = shift || 'Atom';

	# feed links are possible only for project views
	return unless (defined $project);
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branch refs use the 'refs/heads/' prefix (full name), which tells
	# them apart from tag links; $hash_base is consulted before $hash
	my $branch;
	foreach my $ref ($hash_base, $hash) {
		next unless (defined $ref && $ref =~ m!^refs/heads/(.*)$!);
		$branch = $1;
		last;
	}

	# find log type for feed description (title)
	my $type;
	if (defined $file_name) {
		$type  = "history of $file_name";
		$type .= "/" if ($action eq 'tree');
		$type .= " on '$branch'" if (defined $branch);
	} elsif (defined $branch) {
		$type = "log of $branch";
	} else {
		$type = 'log';
	}

	my %res = (
		action      => lc($format),
		-title      => $type,
		'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
		'file_name' => $file_name,
	);
	return %res;
}
2391
2392 ## ----------------------------------------------------------------------
2393 ## git utility subroutines, invoking git commands
2394
# Returns, as a list, the path to the core git executable followed by the
# --git-dir parameter for the current $git_dir.  Every call is counted in
# $number_of_git_cmds.
sub git_cmd {
	++$number_of_git_cmds;
	return ($GIT, "--git-dir=$git_dir");
}
2400
# Quote the given arguments so that they can be passed to the shell.
# Each argument is wrapped in single quotes, and every ' or ! inside it is
# taken out of the quotes and backslash-escaped:
#   quote_command("command", "arg 1", "arg with ' and ! characters")
#   => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# The arguments themselves are left unmodified.
# Try to avoid using this function wherever possible.
sub quote_command {
	my @quoted;
	foreach my $arg (@_) {
		(my $escaped = $arg) =~ s/(['!])/'\\$1'/g;
		push @quoted, "'$escaped'";
	}
	return join(' ', @quoted);
}
2409
# Get the HEAD ref of the given project as a hash, by asking
# git_get_full_hash() for 'HEAD'.
sub git_get_head_hash {
	my ($proj_path) = @_;
	return git_get_full_hash($proj_path, 'HEAD');
}
2414
# Same as git_get_hash(): all arguments are handed over unchanged, no extra
# rev-parse option is added.
sub git_get_full_hash {
	my @args = @_;
	return git_get_hash(@args);
}
2418
# Like git_get_hash(), with '--short=7' appended to the arguments so that
# it reaches rev-parse as an option.
sub git_get_short_hash {
	my @args = (@_, '--short=7');
	return git_get_hash(@args);
}
2422
# Run "git rev-parse --verify -q [options] <hash>" in the repository
# "$projectroot/$project" and return the first line of its output with the
# newline removed, or undef if nothing was read or git could not be started.
# $git_dir is pointed at that repository for the call and is put back
# afterwards only if it held a defined value on entry.
sub git_get_hash {
	my ($project, $hash, @options) = @_;
	my $saved_git_dir = $git_dir;
	my $retval;

	$git_dir = "$projectroot/$project";
	my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
	if (open my $fd, '-|', @cmd) {
		$retval = <$fd>;
		chomp $retval if defined $retval;
		close $fd;
	}

	$git_dir = $saved_git_dir if defined $saved_git_dir;
	return $retval;
}
2439
# Get the type of the given object, as printed by "git cat-file -t".
# Returns nothing if git cannot be started or if closing the pipe reports
# a failure.
sub git_get_type {
	my ($hash) = @_;

	my @cmd = (git_cmd(), "cat-file", '-t', $hash);
	open(my $fd, "-|", @cmd) or return;
	my $type = <$fd>;
	return unless close $fd;

	chomp $type;
	return $type;
}
2450
# repository configuration cache: %config holds the parsed entries and
# $config_file names the config file they were read from
# (both are filled in by git_get_project_config)
our %config;
our $config_file = '';
2454
# Add $value under $key in the hash referenced by $hash.
# The first value for a key is stored directly in the hash (not as
# [ <value> ]); a second value turns the entry into an anonymous array
# holding both, and later values are appended to that array.
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (exists $hash->{$key} && ref $hash->{$key}) {
		# already multi-valued
		push @{$hash->{$key}}, $value;
	} elsif (exists $hash->{$key}) {
		# second value: promote the single value to a list
		$hash->{$key} = [ $hash->{$key}, $value ];
	} else {
		$hash->{$key} = $value;
	}
}
2468
# Return the git configuration of the current project ($git_dir) as a hash,
# read from the NUL-separated output of "git config -z -l".
#
# $section_regexp, if given, is a regular expression; only keys whose
# section matches it (i.e. that start with "<section>.") are kept, e.g.
# 'gitweb'.  Keys that occur several times get an array reference as value
# (see hash_set_multi); a key without a value is stored as undef.
# Returns nothing if git cannot be started.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# Compile the filter once per call.  The /o modifier must not be used
	# here: it would freeze the first $section_regexp ever seen for the
	# life of the process and silently ignore a different section later.
	my $section_re = defined $section_regexp
		? qr/^(?:$section_regexp)\./
		: undef;

	# entries are terminated by NUL, key and value are separated by newline
	local $/ = "\0";

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		my ($key, $value) = split(/\n/, $keyval, 2);
		# an empty record has no key to store
		next unless defined $key;

		hash_set_multi(\%config, $key, $value)
			if (!defined $section_re || $key =~ $section_re);
	}
	close $fh;

	return %config;
}
2491
# Convert a config value to a boolean.
# A missing value (undef, i.e. a bare "section.key"), a number greater
# than 0, and the words 'true' and 'yes' in any letter case are true;
# every other value is false (never an error).  Whitespace around the
# value is ignored.
sub config_to_bool {
	my ($val) = @_;

	# section.key
	return 1 unless defined $val;

	# strip trailing and leading whitespace
	$val =~ s/\s+$//;
	$val =~ s/^\s+//;

	return (($val =~ /^\d+$/ && $val) ||   # section.key = 1
	        ($val =~ /^(?:true|yes)$/i));  # section.key = true
}
2507
# Convert a config value to a simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (in either letter case)
# causes the value to be multiplied by 1024, 1048576, or 1073741824.
# Whitespace around the value is ignored.  A value with no such suffix is
# returned as it is (after trimming); an undefined value (key without a
# value) is returned as undef.
sub config_to_int {
	my $val = shift;

	# nothing to trim or convert for a valueless key
	return $val unless defined $val;

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
		my %multiplier = (
			'k' =>       1024,
			'm' =>    1048576,
			'g' => 1073741824,
		);
		# a bare unit such as "k" has an empty number part; count it as 0
		$num = 0 if $num eq '';
		return $num * $multiplier{lc($unit)};
	}
	return $val;
}
2527
# Convert a config value to an array reference, if needed:
# a reference is returned as it is, any other defined value is wrapped
# in a one-element array, and undef becomes an empty array.
sub config_to_multi {
	my ($val) = @_;

	return $val if ref($val);
	return defined($val) ? [ $val ] : [];
}
2534
# Look up the gitweb.<key> configuration variable of the current project.
#
# $key may be given with or without the "gitweb." prefix.  $type is
# optional: 'bool' (or '--bool') yields the string 'true' or 'false',
# 'int' (or '--int') yields a number via config_to_int(); any other type
# is ignored and the stored value is returned as it is.
# The parsed configuration is cached in %config and re-read whenever
# $config_file does not name "$git_dir/config".
# Returns nothing if $git_dir is not set, the key is empty or contains
# non-word characters, or the variable does not exist.
sub git_get_project_config {
	my ($key, $type) = @_;

	return unless defined $git_dir;

	# key sanity check
	return unless ($key);
	# only subsection, if exists, is case sensitive,
	# and not lowercased by 'git config -z -l'
	if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
		$key = join(".", lc($1), $2, lc($3));
	} else {
		$key = lc($key);
	}
	$key =~ s/^gitweb\.//;
	return if ($key =~ m/\W/);

	# type sanity check: anything but 'bool' and 'int' means "untyped"
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			if ($type ne 'bool' && $type ne 'int');
	}

	# get config, unless the cached one belongs to this repository
	my $wanted_file = "$git_dir/config";
	unless (defined $config_file && $config_file eq $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	my $name = "gitweb.$key";
	return unless exists $config{$name};

	# ensure given type
	return $config{$name} unless defined $type;
	if ($type eq 'bool') {
		# backward compatibility: 'git config --bool' returns true/false
		return config_to_bool($config{$name}) ? 'true' : 'false';
	}
	if ($type eq 'int') {
		return config_to_int($config{$name});
	}
	return $config{$name};
}
2580
# Get the hash of the entry at the given path in the given tree-ish,
# using "git ls-tree <base> -- <path>".
#
# $base is the tree-ish (ref), $path the path inside it (trailing slashes
# are ignored), and $type, if given, the object type the entry must have.
# Returns undef if no path is given, the entry does not exist, its type
# differs from $type, or the ls-tree output cannot be parsed.
# Calls die_error() if git cannot be started.
sub git_get_hash_by_path {
	my $base = shift;
	my $path = shift;
	my $type = shift;

	# test for presence, not truth: "0" is a legitimate file name
	return undef unless (defined $path && length $path);

	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
	# Take the fields from this match only, so that an unparsable line
	# cannot pick up stale captures from an earlier match; object names
	# may have 40 (SHA-1) or 64 (SHA-256) hex digits.
	my ($entry_type, $entry_hash) =
		($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40}(?:[0-9a-fA-F]{24})?)\t/)
		or return undef;

	if (defined $type && $type ne $entry_type) {
		# type doesn't match
		return undef;
	}
	return $entry_hash;
}
2607
# Get the path of the entry with the given hash at the given tree-ish (ref),
# by scanning the output of "git ls-tree -r -t -z <base>".
# Used to get the 'from' filename for combined diff (merge commit) for renames.
#
# Returns the path of the first matching entry, undef if there is none or
# git cannot be started, and nothing if $base or $hash is missing.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	# -z output: entries are terminated by NUL, not by newline
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;
	while (my $line = <$fd>) {
		chomp $line;

		#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
		#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
		# $hash is matched literally (\Q..\E) in the object-name column
		# only; /s lets the path contain newlines, which -z leaves unquoted
		if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
			my $path = $1;
			close $fd;
			return $path;
		}
	}
	close $fd;
	return undef;
}
2631
2632 ## ......................................................................
2633 ## git utility functions, directly accessing git repository
2634
# Get the value of a config variable for the project at $path: the first
# line of the file named like the variable in the repository
# ($GIT_DIR/$name), with its newline removed, or, if that file cannot be
# opened, the gitweb.$name variable from the repository config file.
# Sets $git_dir to "$projectroot/$path" as a side effect.
sub git_get_file_or_project_config {
	my ($path, $name) = @_;

	$git_dir = "$projectroot/$path";
	if (open my $fd, '<', "$git_dir/$name") {
		my $conf = <$fd>;
		close $fd;
		chomp $conf if defined $conf;
		return $conf;
	}

	# no such file: fall back to the repository config
	return git_get_project_config($name);
}
2651
# Description of the project at $path: the 'description' file of the
# repository or the gitweb.description config variable
# (see git_get_file_or_project_config).
sub git_get_project_description {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'description');
}
2656
# Category of the project at $path: the 'category' file of the repository
# or the gitweb.category config variable
# (see git_get_file_or_project_config).
sub git_get_project_category {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'category');
}
2661
2662
# Return the content tags of the given project as a hash reference
# { <tagname> => <weight> }.  Sets $git_dir to "$projectroot/$project".
#
# supported formats (the first one found is used):
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its first line is a number, use it as tag weight,
#   - otherwise (including an empty file) add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
	my $project = shift;
	my $ctags = {};

	$git_dir = "$projectroot/$project";
	if (opendir my $dh, "$git_dir/ctags") {
		# plain files only; this also drops the '.' and '..' entries
		my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
		foreach my $tagfile (@files) {
			open my $ct, '<', $tagfile
				or next;
			my $val = <$ct>;
			close $ct;

			# the tag name is the file name without the directory part
			(my $ctag = $tagfile) =~ s#.*/##;
			# $val is undef for an empty file: do not match against it
			if (defined $val) {
				chomp $val;
			}
			if (defined $val && $val =~ /^\d+$/) {
				$ctags->{$ctag} = $val;
			} else {
				$ctags->{$ctag} = 1;
			}
		}
		closedir $dh;

	} elsif (open my $fh, '<', "$git_dir/ctags") {
		while (my $line = <$fh>) {
			chomp $line;
			$ctags->{$line}++ if $line;
		}
		close $fh;

	} else {
		my $taglist = config_to_multi(git_get_project_config('ctag'));
		foreach my $tag (@$taglist) {
			$ctags->{$tag}++;
		}
	}

	return $ctags;
}
2709
# Return a hash reference whose keys are the content tags ('ctags') found
# in the given list of projects and whose values are the sums of the
# weights each tag has across those projects.
sub git_gather_all_ctags {
	my ($projects) = @_;
	my %total;

	for my $proj (@$projects) {
		$total{$_} += $proj->{'ctags'}->{$_}
			for keys %{$proj->{'ctags'}};
	}

	return \%total;
}
2724
# Turn a { <tag> => <weight> } hash reference into a tag cloud.
#
# Tags that differ only in letter case are merged: their weights are
# summed, and the spelling with the largest single weight is displayed.
# If HTML::TagCloud can be loaded, an object of that class is returned;
# otherwise a hash reference mapping each lowercased tag to
# { count => <weight>, ctag => <link> }.  The tag equal to the 'by_tag'
# CGI parameter gets its title wrapped in <span class="match">.
sub git_populate_project_tagcloud {
	my ($ctags) = @_;

	# First, merge different-cased tags; tags vote on casing
	my %ctags_lc;
	foreach my $name (keys %$ctags) {
		my $weight = $ctags->{$name};
		my $merged = $ctags_lc{lc $name} ||= {};
		$merged->{count} += $weight;
		if (!$merged->{topcount} || $merged->{topcount} < $weight) {
			$merged->{topcount} = $weight;
			$merged->{topname}  = $name;
		}
	}

	my $matched = $cgi->param('by_tag');
	# mark the title of the currently selected tag
	my $highlight = sub {
		my ($ctag, $title) = @_;
		return $title unless (defined $matched && $matched eq $ctag);
		return qq(<span class="match">$title</span>);
	};

	if (eval { require HTML::TagCloud; 1; }) {
		my $cloud = HTML::TagCloud->new;
		foreach my $ctag (sort keys %ctags_lc) {
			# Pad the title with spaces so that the cloud looks
			# less crammed.
			my $title = esc_html($ctags_lc{$ctag}->{topname});
			$title =~ s/ /&nbsp;/g;
			$title =~ s/^/&nbsp;/g;
			$title =~ s/$/&nbsp;/g;
			$title = $highlight->($ctag, $title);
			$cloud->add($title, href(project=>undef, ctag=>$ctag),
			            $ctags_lc{$ctag}->{count});
		}
		return $cloud;
	}

	# no HTML::TagCloud: plain hash of counts and ready-made links
	my %cloud;
	foreach my $ctag (keys %ctags_lc) {
		my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
		$title = $highlight->($ctag, $title);
		my $link = $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
		$cloud{$ctag} = {
			count => $ctags_lc{$ctag}->{count},
			ctag  => $link,
		};
	}
	return \%cloud;
}
2770
# Render a tag cloud made by git_populate_project_tagcloud as HTML,
# showing at most $count tags.  An HTML::TagCloud object renders itself;
# a plain hash becomes a comma-separated list of links inside a
# <div id="htmltagcloud">, centered when no project is selected.
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;

	return $cloud->html_and_css($count)
		if (ref $cloud eq 'HTML::TagCloud');

	# NOTE(review): the sort is ascending by count, so the tags kept when
	# truncating to $count are the lowest-weighted ones - confirm intended
	my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
	my @shown = splice(@tags, 0, $count);
	my $align = $project ? '' : ' align="center"';

	return '<div id="htmltagcloud"' . $align . '>' .
	       join (', ', map { $cloud->{$_}->{'ctag'} } @shown) .
	       '</div>';
}
2785
# Return the clone URLs of the project at $path: the lines of its
# 'cloneurl' file (newlines removed) or, if that file cannot be opened,
# the values of the gitweb.url config variable.
# In list context the URLs are returned as a list, otherwise as an array
# reference.  Sets $git_dir to "$projectroot/$path" as a side effect.
sub git_get_project_url_list {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";
	if (open my $fd, '<', "$git_dir/cloneurl") {
		my @git_project_url_list = <$fd>;
		chomp @git_project_url_list;
		close $fd;
		return wantarray ? @git_project_url_list : \@git_project_url_list;
	}

	# no cloneurl file: use the (possibly multi-valued) config variable
	my $configured = config_to_multi(git_get_project_config('url'));
	return wantarray ? @$configured : $configured;
}
2799
# Collect the projects gitweb may show.
#
# $projects_list names either a directory, which is scanned with
# File::Find (not deeper than $project_maxdepth levels), or a file with
# one url-encoded "<path> <owner>" entry per line.  The optional $filter
# restricts the result to projects below that subdirectory; a trailing
# ".git" in the filter is ignored.  Only paths accepted by
# check_export_ok() are returned.
#
# Returns a list of hash references with a 'path' key, plus an 'owner'
# key for entries read from a file; nothing if the file cannot be opened.
sub git_get_projects_list {
	my $filter = shift || '';
	my @list;

	$filter =~ s/\.git$//;

	if (-d $projects_list) {
		# search in directory
		my $dir = $projects_list;
		# remove the trailing "/"
		$dir =~ s!/+$!!;
		# Measure the prefix on the normalized $dir, because that is what
		# File::Find is started with: taking it from $projects_list would,
		# for a value ending in "/", cut the first character off every
		# project path and shift the depth limit by one level.
		my $pfxlen = length("$dir");
		my $pfxdepth = ($dir =~ tr!/!!);
		# when filtering, search only given subdirectory
		if ($filter) {
			$dir .= "/$filter";
			$dir =~ s!/+$!!;
		}

		File::Find::find({
			follow_fast => 1, # follow symbolic links
			follow_skip => 2, # ignore duplicates
			dangling_symlinks => 0, # ignore dangling symlinks, silently
			wanted => sub {
				# global variables
				our $project_maxdepth;
				our $projectroot;
				# skip project-list toplevel, if we get it.
				return if (m!^[/.]$!);
				# only directories can be git repositories
				return unless (-d $_);
				# don't traverse too deep (Find is super slow on os x)
				# $project_maxdepth excludes depth of $projectroot
				if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
					$File::Find::prune = 1;
					return;
				}

				# path relative to the top of the projects directory
				my $path = substr($File::Find::name, $pfxlen + 1);
				# we check related file in $projectroot
				if (check_export_ok("$projectroot/$path")) {
					push @list, { path => $path };
					# do not look for repositories inside a repository
					$File::Find::prune = 1;
				}
			},
		}, "$dir");

	} elsif (-f $projects_list) {
		# read from file(url-encoded):
		# 'git%2Fgit.git Linus+Torvalds'
		# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
		# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
		open my $fd, '<', $projects_list or return;
	PROJECT:
		while (my $line = <$fd>) {
			chomp $line;
			my ($path, $owner) = split ' ', $line;
			$path = unescape($path);
			$owner = unescape($owner);
			# blank line
			if (!defined $path) {
				next PROJECT;
			}
			# if $filter is provided, check if $path begins with $filter
			if ($filter && $path !~ m!^\Q$filter\E/!) {
				next PROJECT;
			}
			if (check_export_ok("$projectroot/$path")) {
				my $pr = {
					path => $path,
					owner => to_utf8($owner),
				};
				push @list, $pr;
			}
		}
		close $fd;
	}
	return @list;
}
2878
# Return the projects from the given list that are not forks of another
# project in that list.  A project is a fork of 'repo.git' if its path
# lies inside the existing directory 'repo/' under $projectroot.
# written with help of Tree::Trie module (Perl Artistic License, GPL compatibile)
# as side effects it sets 'forks' field to list of forks for forked projects
sub filter_forks_from_projects_list {
	my ($projects) = @_;

	# prefix tree of directories (path components); the '' key is the
	# end marker and holds the project whose directory ends there
	my %trie;

	# generate trie out of those directories that might contain forks
	foreach my $pr (@$projects) {
		my $path = $pr->{'path'};
		$path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
		next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
		next unless ($path);      # skip '.git' repository: tests, git-instaweb
		next unless (-d "$projectroot/$path"); # containing directory exists
		$pr->{'forks'} = [];      # there can be 0 or more forks of project

		# add to trie: walk down, creating the nodes that are missing
		my $node = \%trie;
		foreach my $dir (split('/', $path)) {
			$node->{$dir} = {} unless exists $node->{$dir};
			$node = $node->{$dir};
		}
		# create end marker, store $pr as a data; the first project wins
		$node->{''} = $pr unless exists $node->{''};
	}

	# filter out forks, by finding shortest prefix match for paths
	my @filtered;
	foreach my $pr (@$projects) {
		# trie lookup
		my $node = \%trie;
		my $is_fork = 0;
		foreach my $dir (split('/', $pr->{'path'})) {
			if (exists $node->{''}) {
				# found [shortest] prefix, is a fork - skip it
				push @{$node->{''}{'forks'}}, $pr;
				$is_fork = 1;
				last;
			}
			# not in trie, cannot have prefix, not a fork
			last unless exists $node->{$dir};
			# If the dir is there, we just walk one step down the trie.
			$node = $node->{$dir};
		}
		# kept: no prefix matched, or we ran out of path components
		push @filtered, $pr unless $is_fork;
	}

	return @filtered;
}
2938
# Return the projects from @$projlist that pass the given filters:
#   tagfilter  => keep projects having this content tag (case-insensitive)
#   searchtext => keep projects whose path or long description matches
#                 this regular expression
# Without any filter the whole list is returned.
# note: fill_project_list_info must be run first,
# for 'descr_long' and 'ctags' to be filled
sub search_projects_list {
	my ($projlist, %opts) = @_;
	my ($tagfilter, $searchtext) = @opts{qw(tagfilter searchtext)};

	return @$projlist
		unless ($tagfilter || $searchtext);

	my @projects;
 PROJECT:
	foreach my $pr (@$projlist) {

		if ($tagfilter) {
			my $ctags = $pr->{'ctags'};
			next PROJECT unless ref($ctags) eq 'HASH';
			my $wanted = lc($tagfilter);
			next PROJECT unless
				grep { lc($_) eq $wanted } keys %$ctags;
		}

		if ($searchtext) {
			next PROJECT if
				$pr->{'path'} !~ /$searchtext/ &&
				$pr->{'descr_long'} !~ /$searchtext/;
		}

		push @projects, $pr;
	}

	return @projects;
}
2970
# project path => owner, as listed in the $projects_list file;
# undef until git_get_project_list_from_file() has run
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from the $projects_list file, once.
# If $projects_list is not a plain file, or cannot be opened, the map
# stays empty.
sub git_get_project_list_from_file {

	return if (defined $gitweb_project_owner);

	$gitweb_project_owner = {};
	# read from file (url-encoded):
	# 'git%2Fgit.git Linus+Torvalds'
	# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
	# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
	return unless (-f $projects_list);

	# do not read from a handle that failed to open
	open(my $fd, '<', $projects_list)
		or return;
	while (my $line = <$fd>) {
		chomp $line;
		my ($pr, $ow) = split ' ', $line;
		# blank line: there is no project to record
		next unless defined $pr;
		$pr = unescape($pr);
		$ow = unescape($ow);
		$gitweb_project_owner->{$pr} = to_utf8($ow);
	}
	close $fd;
	return;
}
2993
# Return the owner of the given project, taken from the first source that
# has one: the $projects_list file (via $gitweb_project_owner), the
# gitweb.owner config variable, or get_file_owner() for the repository
# directory.  Returns undef if no project is given.
# Sets $git_dir to "$projectroot/$project" as a side effect.
sub git_get_project_owner {
	my ($project) = @_;

	return undef unless $project;
	$git_dir = "$projectroot/$project";

	# load the owners listed in the projects file on first use
	git_get_project_list_from_file()
		unless defined $gitweb_project_owner;

	my $owner;
	$owner = $gitweb_project_owner->{$project}
		if exists $gitweb_project_owner->{$project};
	$owner = git_get_project_config('owner')
		unless defined $owner;
	$owner = get_file_owner("$git_dir")
		unless defined $owner;

	return $owner;
}
3017
# Find the age of the newest commit under refs/heads of the repository at
# "$projectroot/$path", using 'git for-each-ref' sorted by committer date.
# Sets the global $git_dir as a side effect.
#
# Returns ($age_in_seconds, age_string($age)) on success, (undef, undef)
# when no timestamp could be extracted from the output, and an empty list
# when the command could not be started or closing the pipe failed.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        open(my $fd, "-|", git_cmd(), 'for-each-ref',
             '--format=%(committer)',
             '--sort=-committerdate',
             '--count=1',
             'refs/heads') or return;
        my $most_recent = <$fd>;
        close $fd or return;

        # the committer line ends in '<epoch> <timezone>'
        return (undef, undef)
                unless defined $most_recent &&
                       $most_recent =~ / (\d+) [-+][01]\d\d\d$/;

        my $age = time - $1;
        return ($age, age_string($age));
}
3038
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote URL
# if it's not defined), and we cannot use 'git remote show' because that would
# try to make a network roundtrip. So the only way to find if that particular
# remote is defined is to walk the list provided by 'git remote -v' and stop if
# and when we find what we want.
#
# Parameters:
#   $wanted - optional remote name; when given, only that remote is collected
# Returns a hash (list context) or hash reference (scalar context) keyed by
# remote name.  Each value is a hash with a 'heads' entry (initially undef)
# plus one entry per '(<key>)' suffix printed by 'git remote -v', mapping
# that key to the URL.  Returns nothing if the command cannot be started or
# closing the pipe fails.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # check open() itself: the lexical handle is not a reliable
        # indicator of whether the open succeeded
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # '<name>\t<url> (<key>)'; skip lines of any other shape
                # rather than reusing captures from an earlier match
                $remote =~ s!\t(.*?)\s+\((\w+)\)$!!
                        or next;
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # 'heads' is a placeholder until the remote heads are filled in
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3063
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
#
# The heads are obtained with one git_get_heads_list() call for the
# 'remotes/<name>' classes of all remotes.  For every remote, 'heads' is set
# to the list of head entries whose name starts with '<remote>/'; that prefix
# is stripped from the entry's 'name' in place.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # \Q..\E: the remote name is literal text, not a pattern
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3076
# Collect references from 'git show-ref --dereference'.
#
# Parameters:
#   $type - optional ref class (the part after 'refs/'); when given, it is
#           passed to show-ref as pattern and only names starting with it
#           are recorded
# Returns a reference to a hash mapping each object id to the list of ref
# names (without the 'refs/' prefix) pointing at it, or nothing if the
# command cannot be started or closing the pipe fails.
sub git_get_references {
        my $type = shift || "";
        my %refs;
        # use -- <pattern> if $type
        my @pattern = $type ? ("--", "refs/$type") : ();

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
                push @{$refs{$1}}, $2;
        }
        close $fd or return;
        return \%refs;
}
3099
# Describe $hash relative to a tag using 'git name-rev --tags'.
#
# Returns the part of the output following '<hash> tags/', or undef when no
# hash is given, the command prints nothing, or the output has another form
# (for example '<hash> undefined').  Returns nothing if the command cannot
# be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # no output at all: nothing to match against
        return undef unless defined $name_rev;

        # $hash is matched as literal text
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
3115
3116 ## ----------------------------------------------------------------------
3117 ## parse to hash functions
3118
# Break an epoch timestamp into display-ready pieces.
#
# Parameters:
#   $epoch - seconds since the epoch
#   $tz    - timezone as '[-+]HHMM'; defaults to "-0000"
# Returns a hash with:
#   hour, minute, mday, day, month  - UTC components (day/month as names)
#   rfc2822, mday-time, iso-8601    - UTC formatted strings
#   hour_local, minute_local        - components after applying $tz
#   tz_local                        - $tz as given
#   iso-tz                          - local time followed by $tz
# A $tz that is not of the form '[-+]HHMM' is treated as a zero offset.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # offset from UTC in seconds; only computed when $tz is well-formed,
        # so a malformed value never feeds undef into the arithmetic
        my $offset = 0;
        if ($tz =~ m/^([-+])(\d\d)(\d\d)$/) {
                my ($tz_sign, $tz_hour, $tz_min) = ($1, $2, $3);
                $offset = ($tz_sign eq '-' ? -1 : +1) *
                          ((($tz_hour*60) + $tz_min)*60);
        }
        my $local = $epoch + $offset;
        ($sec, $min, $hour, $mday, $mon, $year) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3152
# Read the tag object $tag_id with 'git cat-file tag' and parse it.
#
# Returns a hash with 'id', the header fields that were present ('object',
# 'type', 'name', and for a tagger line 'author', 'author_epoch',
# 'author_tz', 'author_name' and possibly 'author_email') and 'comment', a
# reference to the list of remaining lines.  Returns nothing if the command
# cannot be started, closing the pipe fails, or no 'tag' line was found.
sub parse_tag {
        my $tag_id = shift;
        my %tag;
        my @comment;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
        $tag{'id'} = $tag_id;
        while (my $line = <$fd>) {
                chomp $line;
                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                        next;
                }
                if ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                        next;
                }
                if ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                        next;
                }
                if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @tag{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                        next;
                }
                if ($line =~ m/--BEGIN/) {
                        # this line already belongs to the comment
                        push @comment, $line;
                        last;
                }
                # an empty line ends the header
                last if $line eq "";
        }
        # everything left is the comment
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag;
}
3193
# Parse one record of 'git rev-list --header' output.
#
# Parameters:
#   $commit_text - the record; its first line is the commit id, followed
#                  by parent ids when rev-list was run with --parents
#   $withparents - when defined, parents are taken from the first line only
#                  and 'parent' header lines are ignored
# Returns a hash with id, tree, parents, parent, author* and committer*
# fields, title, title_short, comment (list reference) and the age*
# fields; returns nothing if the record is empty, does not start with an
# object id, or has no tree line.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        return unless @commit_lines;

        my $header = shift @commit_lines;
        return unless $header =~ m/^[0-9a-fA-F]{40}/;

        ($co{'id'}, my @parents) = split ' ', $header;
        # the loop also stops at (and consumes) the first empty line,
        # because an empty string is false
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        my ($ident, $epoch, $tz) = ($1, $2, $3);
                        $co{'author'} = to_utf8($ident);
                        $co{'author_epoch'} = $epoch;
                        $co{'author_tz'} = $tz;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @co{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        my ($ident, $epoch, $tz) = ($1, $2, $3);
                        $co{'committer'} = to_utf8($ident);
                        $co{'committer_epoch'} = $epoch;
                        $co{'committer_tz'} = $tz;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                @co{'committer_name', 'committer_email'} = ($1, $2);
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        return unless defined $co{'tree'};

        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # The first non-empty line is the title.  $title aliases the element
        # of @commit_lines, so the edits below also change that line in
        # the 'comment' list.
        foreach my $title (@commit_lines) {
                $title =~ s/^    //;
                next if $title eq "";

                $co{'title'} = chop_str($title, 80, 5);
                # remove leading stuff of merges to make the interesting part visible
                if (length($title) > 50) {
                        $title =~ s/^Automatic //;
                        $title =~ s/^merge (of|with) /Merge ... /i;
                        $title =~ s/(http|rsync):\/\/// if length($title) > 50;
                        $title =~ s/(master|www|rsync)\.// if length($title) > 50;
                        $title =~ s/kernel.org:?// if length($title) > 50;
                        $title =~ s/\/pub\/scm// if length($title) > 50;
                }
                $co{'title_short'} = chop_str($title, 50, 5);
                last;
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        s/^    // foreach @commit_lines;
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($mday, $mon, $year) = (gmtime($co{'committer_epoch'}))[3, 4, 5];
        my $date = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        # commits older than two weeks lead with the date, newer ones with
        # the relative age
        @co{'age_string_date', 'age_string_age'} =
                $age > 60*60*24*7*2
                        ? ($date, $co{'age_string'})
                        : ($co{'age_string'}, $date);
        return %co;
}
3291
# Parse the single commit $commit_id via 'git rev-list --parents --header
# --max-count=1'.  Returns the hash produced by parse_commit_text() (empty
# when nothing could be parsed); calls die_error(500, ...) if the command
# cannot be started.
sub parse_commit {
        my ($commit_id) = @_;

        # rev-list --header separates records with NUL
        local $/ = "\0";

        my @rev_list = (
                "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--",
        );
        open my $fd, "-|", git_cmd(), @rev_list
                or die_error(500, "Open git-rev-list failed");
        # <$fd> is read in list context here, as parse_commit_text()'s
        # leading argument(s)
        my %co = parse_commit_text(<$fd>, 1);
        close $fd;

        return %co;
}
3310
# Parse a series of commits reachable from $commit_id using
# 'git rev-list --header'.
#
# Parameters:
#   $commit_id - starting revision
#   $maxcount  - maximum number of commits (a false value means 1)
#   $skip      - number of commits to skip (a false value means 0)
#   $filename  - optional path limiter
#   @args      - extra rev-list options placed right after --header
# The global @extra_options are passed to rev-list as well.
# Returns the list of commit hash references (array reference in scalar
# context); calls die_error(500, ...) if the command cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;
        my @cos;

        $maxcount ||= 1;
        $skip ||= 0;

        # rev-list --header separates records with NUL
        local $/ = "\0";

        my @rev_list = (
                "rev-list",
                "--header",
                @args,
                "--max-count=$maxcount",
                "--skip=$skip",
                @extra_options,
                $commit_id,
                "--",
        );
        push @rev_list, $filename if $filename;

        open my $fd, "-|", git_cmd(), @rev_list
                or die_error(500, "Open git-rev-list failed");
        while (my $record = <$fd>) {
                my %co = parse_commit_text($record);
                push @cos, \%co;
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3338
# parse line of git-diff-tree "raw" output
#
# Three line shapes are recognized:
#   - ordinary diff: sets from_mode, to_mode, from_id, to_id, status,
#     similarity, from_file, to_file (and file, unless renamed or copied)
#   - combined diff (for merge commit): sets nparents, from_mode and from_id
#     (array references), to_mode, to_id, status (array reference of status
#     letters) and to_file
#   - a bare object id: sets commit
# Any other line gives an empty result.  Returns a hash in list context and
# a hash reference in scalar context.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                @res{qw(from_mode to_mode from_id to_id status similarity)} =
                        ($1, $2, $3, $4, $5, $6);
                my $paths = $7;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $paths);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($paths);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif ($line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/) {
                my ($colons, $modes, $ids, $status, $path) = ($1, $2, $3, $4, $5);
                # the last mode and the last id belong to the result
                my @modes = split(' ', $modes);
                my @ids   = split(' ', $ids);
                $res{'nparents'}  = length($colons);
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $status) ];
                $res{'to_file'}   = unquote($path);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3377
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
#
# A hash reference is handed back unchanged; anything else is passed to
# parse_difftree_raw_line().
sub parsed_difftree_line {
        my $line_or_ref = shift;

        # pre-parsed (or generated by hand)
        return $line_or_ref
                if ref($line_or_ref) eq "HASH";

        return parse_difftree_raw_line($line_or_ref);
}
3390
# parse line of git-ls-tree output
#
# Parameters:
#   $line - one entry of ls-tree output
#   %opts - '-l' => true if the line has a size column (ls-tree -l),
#           '-z' => true if the name is verbatim (ls-tree -z) and must not
#                   be passed through unquote()
# Returns a hash (list context) or hash reference (scalar context) with
# mode, type, hash, name and, with '-l', size.  A line that does not have
# the expected form gives an empty result instead of values left over from
# an unrelated earlier match.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s) {
                        @res{qw(mode type hash size)} = ($1, $2, $3, $4);
                        $res{'name'} = $opts{'-z'} ? $5 : unquote($5);
                }
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s) {
                        @res{qw(mode type hash)} = ($1, $2, $3);
                        $res{'name'} = $opts{'-z'} ? $4 : unquote($4);
                }
        }

        return wantarray ? %res : \%res;
}
3426
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# Parameters:
#   $diffinfo - parsed difftree line (hash reference)
#   $from     - hash reference filled with 'file' and 'href' of the
#               preimage; both are array references for a combined diff
#   $to       - hash reference filled with 'file' and 'href' of the result
#   @parents  - parent commits, used for a combined diff
# An 'href' is left out (or undef in the combined case) for an added file
# on the "from" side and for a deleted file on the "to" side.  Links are
# built with href() using the globals $hash_parent and $hash.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $from_file = $diffinfo->{'from_file'}[$i];
                        $from->{'file'}[$i] = defined $from_file
                                ? $from_file
                                : $diffinfo->{'to_file'};
                        # no link for a new (added) file
                        $from->{'href'}[$i] = $diffinfo->{'status'}[$i] ne "A"
                                ? href(action=>"blob",
                                       hash_base=>$parents[$i],
                                       hash=>$diffinfo->{'from_id'}[$i],
                                       file_name=>$from->{'file'}[$i])
                                : undef;
                }
        } else {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") { # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) { # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3472
3473 ## ......................................................................
3474 ## parse to array of hashes functions
3475
# List heads using 'git for-each-ref', sorted by committer date (newest
# first).
#
# Parameters:
#   $limit   - when true, at most $limit+1 entries are requested
#   @classes - ref classes below 'refs/' to list; defaults to ('heads')
# Returns a list (array reference in scalar context) of hash references
# with fullname, name (without the 'refs/heads/' or 'refs/remotes/'
# prefix), id, title, epoch and age; returns nothing if the command cannot
# be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @headslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # '<id> <refname> <subject>' NUL '<committer> <epoch> <tz>'
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $name, $title) = split(' ', $refinfo, 3);
                my ($committer, $epoch, $tz) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);
                (my $short_name = $name) =~ s!^refs/(?:head|remote)s/!!;

                my %ref_item = (
                        'fullname' => $name,
                        'name'     => $short_name,
                        'id'       => $hash,
                        'title'    => $title || '(no commit message)',
                        'epoch'    => $epoch,
                );
                $ref_item{'age'} = $epoch
                        ? age_string(time - $epoch)
                        : "unknown";

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3514
# List tags using 'git for-each-ref refs/tags', sorted by creator date
# (newest first).
#
# Parameters:
#   $limit - when true, at most $limit+1 entries are requested
# Returns a list (array reference in scalar context) of hash references
# with fullname, type, id, name (without 'refs/tags/'), reftype and refid;
# tag objects also get subject, and tag or commit entries get epoch and
# age.  Returns nothing if the command cannot be started.
sub git_get_tags_list {
        my $limit = shift;
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my ($creator, $epoch, $tz) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
                (my $short_name = $name) =~ s!^refs/tags/!!;

                my %ref_item = (
                        'fullname' => $name,
                        'type'     => $type,
                        'id'       => $id,
                        'name'     => $short_name,
                );
                if ($type eq "tag") {
                        # tag object: record what it points to
                        @ref_item{'subject', 'reftype', 'refid'} =
                                ($title, $reftype, $refid);
                } else {
                        # the ref points directly at the object
                        @ref_item{'reftype', 'refid'} = ($type, $id);
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'} = $epoch
                                ? age_string(time - $epoch)
                                : "unknown";
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3563
3564 ## ----------------------------------------------------------------------
3565 ## filesystem-related functions
3566
# Return the name of the owner of $path, taken from the GCOS field of the
# owning user's passwd entry, cut at the first ',' or ';' and passed
# through to_utf8().
#
# Returns undef if $path cannot be stat()ed or the user has no passwd
# entry / GCOS field.
sub get_file_owner {
        my $path = shift;

        my $st_uid = (stat($path))[4];
        # Without this guard a failed stat() would pass undef to getpwuid(),
        # which numifies to uid 0 and reports that account as the owner.
        return undef unless defined $st_uid;

        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3579
# Print the contents of $filename to the currently selected output handle,
# passing every line through to_utf8().
#
# The caller is expected to have checked that the file exists; if it cannot
# be opened anyway, nothing is printed.
sub insert_file {
        my $filename = shift;

        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3588
3589 ## ......................................................................
3590 ## mimetype related functions
3591
# Look up the MIME type for $filename's extension in the map file $mimemap.
#
# The map has one type per line, followed by whitespace-separated
# extensions; lines starting with '#' are comments.  When an extension is
# listed more than once, the last entry wins.
#
# Returns the MIME type, or undef if the map is not readable, $filename has
# no '.', or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # take the extension only from a successful match
        $filename =~ /\.([^.]*)$/ or return undef;
        my $ext = $1;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # read into a lexical so that the caller's $_ is left alone
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, @exts) = split(/\s+/, $line);
                foreach my $known_ext (@exts) {
                        $mimemap{$known_ext} = $mimetype;
                }
        }
        close($mh);

        return $mimemap{$ext};
}
3611
# Guess the MIME type of $filename from its extension.
#
# If $mimetypes_file is set it is consulted first (a relative path is
# taken relative to the project directory); '/etc/mime.types' is the
# fallback.  Returns undef for a name without '.' or when no map knows
# the extension.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # if it is relative path, it is relative to project
                my $file = $mimetypes_file =~ m!^/!
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime ||= mimetype_guess_file($filename, '/etc/mime.types');
        return $mime;
}
3628
# Determine the MIME type of a blob.
#
# Parameters:
#   $fd       - filehandle of the blob contents (may be false)
#   $filename - name of the blob (may be false)
# The extension maps (mimetype_guess) are tried first.  Without a handle
# the result is $default_blob_plain_mimetype.  Otherwise content that
# passes the -T text test is 'text/plain', and a few image extensions are
# recognized before falling back to 'application/octet-stream'.
sub blob_mimetype {
        my $fd = shift;
        my $filename = shift;

        if ($filename) {
                my $mime = mimetype_guess($filename);
                return $mime if $mime;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain'               if -T $fd;
        return 'application/octet-stream' unless $filename;
        return 'image/png'                if $filename =~ m/\.png$/i;
        return 'image/gif'                if $filename =~ m/\.gif$/i;
        return 'image/jpeg'               if $filename =~ m/\.jpe?g$/i;
        return 'application/octet-stream';
}
3655
# Build the content type for a blob.
#
# $type is used when given (true); otherwise it is determined by
# blob_mimetype($fd, $file_name).  For 'text/plain' the charset from
# $default_text_plain_charset is appended when that is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name)
                unless $type;

        return $type
                unless $type eq 'text/plain' && defined $default_text_plain_charset;

        return "$type; charset=$default_text_plain_charset";
}
3666
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Parameters:
#   $highlight - true if highlighting is enabled
#   $mimetype  - not used by this function
#   $file_name - name of the file; a trailing '.in' is ignored
# The basename is looked up in %highlight_basename first, then its
# extension in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # no '.' in the name means no extension; bail out instead of
        # reading $1 left over from an earlier, unrelated match
        $basename =~ /\.([^.]*)$/
                or return undef;
        my $ext = $1 or return undef;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3683
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# When highlighting applies, $fd is closed and reopened as a pipe reading
# 'git cat-file blob $hash' (global $hash) filtered through $highlight_bin.
# Calls die_error(500, ...) if the pipeline cannot be started.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        return $fd unless ($highlight && defined $syntax);

        close $fd;
        # NOTE(review): $syntax goes into the shell command unquoted;
        # presumably it only ever comes from the highlight tables - confirm
        my $pipeline =
                quote_command(git_cmd(), "cat-file", "blob", $hash)." | ".
                quote_command($highlight_bin).
                " --replace-tabs=8 --fragment --syntax $syntax |";
        open $fd, $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3697
3698 ## ======================================================================
3699 ## functions printing HTML: header, footer, error page
3700
# Build the page title from the site name and, as far as they are defined,
# the globals $project, $action and $file_name:
#   '<site> - <project>/<action> - <file>'
# A '/' is appended to the file name for the "tree" action unless it
# already ends in one.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);

                if (defined $action) {
                        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                $title .= "/"
                                        if $action eq "tree" && $file_name !~ m|/$|;
                        }
                }
        }

        return $title;
}
3718
# Choose the content type for HTML pages: 'application/xhtml+xml' if the
# user agent explicitly accepts it, 'text/html' otherwise.
sub get_content_type_html {
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        my $accept = $cgi->http('HTTP_ACCEPT');
        my $wants_xhtml =
                defined $accept &&
                $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
                $cgi->Accept('application/xhtml+xml') != 0;

        return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3732
# Print the <link rel="alternate"> elements for the page header.
#
# With a project selected, four links are printed: for each of RSS and
# Atom, one for the feed described by get_feed_info() and one for the same
# feed with '--no-merges'.  Without a project, links to the projects index
# and to the OPML list are printed instead.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
                                '-type' => "application/$type+xml"
                        );

                        # Work on per-format copies so that the '--no-merges'
                        # option of one format's second link cannot leak into
                        # the first link of the next format.
                        my %feed_params = (%href_params, 'action' => $type);
                        $link_attr{'-href'} = href(%feed_params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        my %no_merges_params =
                                (%feed_params, 'extra_options' => '--no-merges');
                        $link_attr{'-href'} = href(%no_merges_params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
}
3777
# Print the <link> elements of the HTML <head>: stylesheets, feed links
# (only when $status is exactly '200 OK') and the favicon.
sub print_header_links {
        my $status = shift;

        # A $stylesheet set in a config file is honoured on its own for
        # backwards compatibility; otherwise every non-empty entry of
        # @stylesheets is linked.
        my @sheets = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $sheet (@sheets) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
        }
}
3797
# Print the breadcrumb trail: home link, then (when a project is selected)
# project / action / extra.  The only option read is -action_extra; when it
# is given, the action name is rendered as a link and the extra text is
# appended after it.
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $extra = $opts{-action_extra};

        my $trail = $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                $trail .= $cgi->a({-href => href(action=>"summary")}, esc_html($project));
                if (defined $action) {
                        my $action_print = defined $extra
                                ? $cgi->a({-href => href(action=>$action)}, $action)
                                : $action;
                        $trail .= " / $action_print";
                }
                $trail .= " / $extra" if defined $extra;
                $trail .= "\n";
        }
        print $trail;
}
3818
# Print the search form.  The hash searched from is $hash_base, else $hash,
# else "HEAD".  With the 'pathinfo' feature the project goes into the form's
# action URL; otherwise it is sent as the hidden "p" field.
# Side effect: an undefined global $searchtext is set to "".
sub print_search_form {
        $searchtext = "" unless defined $searchtext;

        my $search_hash = defined $hash_base ? $hash_base
                        : defined $hash      ? $hash
                        :                      "HEAD";

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        my $form_action = $my_uri;
        $form_action .= "/".esc_url($project) if $use_pathinfo;

        # The pieces are appended in output order.
        my $form = $cgi->startform(-method => "get", -action => $form_action) .
                   "<div class=\"search\">\n";
        if (!$use_pathinfo) {
                $form .= $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n";
        }
        $form .= $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n";
        $form .= $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n";
        $form .= $cgi->popup_menu(-name => 'st', -default => 'commit',
                                  -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']);
        $form .= $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?"));
        $form .= " search:\n";
        $form .= $cgi->textfield(-name => "s", -value => $searchtext) . "\n";
        $form .= "<span title=\"Extended regular expression\">" .
                 $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                -checked => $search_use_regexp) .
                 "</span>";
        $form .= "</div>";
        $form .= $cgi->end_form() . "\n";

        print $form;
}
3854
# Print the HTTP header and the opening part of every HTML page: <head>,
# optional site header file, logo, breadcrumbs and (for a project with the
# 'search' feature) the search form.
#
# Arguments: HTTP status line (a false value means "200 OK"), the value for
# the header's -expires, then options.  -no_http_header suppresses the HTTP
# header; all options are also forwarded to print_nav_breadcrumbs().
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        my $mod_perl_version = '';
        $mod_perl_version = " $ENV{'MOD_PERL'}" if $ENV{'MOD_PERL'};
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # Relative stylesheet, favicon etc. URLs only resolve correctly under
        # path_info when an explicit base URL is given.
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n" .
              "<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                my %link_attr = (-href => esc_url($logo_url),
                                 -title => $logo_label);
                my %img_attr = (-src => esc_url($logo),
                                -width => 72, -height => 27,
                                -alt => "git",
                                -class => "logo");
                print $cgi->a(\%link_attr, $cgi->img(\%img_attr));
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $have_search);
}
3913
# Print the closing part of every HTML page: the footer (project
# description and feed links, or OPML/TXT links when no project is
# selected), optional timing information, the optional site footer file,
# the JavaScript includes, and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                print $cgi->a({-href => href(project=>undef, action=>"opml"),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                # no feed information at all: mark the links as generic
                $feed_class .= ' generic' unless %href_params;
                $href_params{'-title'} ||= 'log';

                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }

        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                my $elapsed = tv_interval($t0, [ gettimeofday() ]);
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      $elapsed.
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        my $incremental_blame = (defined $action && $action eq 'blame_incremental');
        if ($incremental_blame) {
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                my $onload = qq!<script type="text/javascript">\n!.
                             qq!window.onload = function () {\n!;
                print $onload;
                print qq!       fixLinks();\n!
                        if gitweb_check_feature('javascript-actions');
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        # the cookie's "expires" value is in days
                        print qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!.
                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }
                print qq!};\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
3990
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# A missing status defaults to 500 and a missing (or false) message to
# "Internal Server Error".  The message is HTML-escaped here; the detailed
# description is printed as-is, so it must already be valid HTML.
# Arguments after the description are options: they are forwarded to
# git_header_html(), and a true -error_handler makes die_error() return
# instead of jumping to DONE_GITWEB.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # A code outside the table would hand undef to git_header_html(),
        # which falls back to "200 OK"; report a server error instead so an
        # error page never goes out with a success status.
        my $http_status = $http_responses{$status} || $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4034
4035 ## ----------------------------------------------------------------------
4036 ## functions printing or outputting HTML: navigation
4037
# Print the page navigation bar: the standard views plus any configured
# 'actions', separated by " | ", followed by the $extra line.
#
# $current  - name of the current view, printed as plain text, not a link
# $suppress - name of a standard view to leave out (optional)
# $head     - hash used for the commit/commitdiff links and, on history-like
#             pages, for the shortlog/log links
# $treehead, $treebase - 'hash' and 'hash_base' for the tree link; also the
#             values substituted for %h and %b in custom action links
# $extra    - HTML printed on the second line (pager or formats)
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' if !defined $extra; # pager or formats

        my @navs = qw(summary shortlog log commit commitdiff tree);
        @navs = grep { $_ ne $suppress } @navs
                if $suppress;

        my %arg;
        $arg{$_} = { action => $_ } foreach @navs;

        if (defined $head) {
                my @with_head = qw(commit commitdiff);
                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
                        push @with_head, qw(shortlog log);
                }
                $arg{$_}{'hash'} = $head foreach @with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        # Custom actions arrive as a flat list of (label, link, position)
        # triples; each label is inserted right after the view named by
        # its position.
        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        while (@actions) {
                my ($label, $link, $pos) = splice(@actions,0,3);
                my @with_label;
                foreach my $nav (@navs) {
                        push @with_label, $nav;
                        push @with_label, $label if $nav eq $pos;
                }
                @navs = @with_label;
                # expand the %-placeholders in the link template
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @entries;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @entries, $nav;
                        next;
                }
                my $target = $arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}});
                push @entries, $cgi->a({-href => $target}, "$nav");
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @entries);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4087
# Returns a submenu for the navigation of the refs views (tags, heads,
# remotes): the entries are joined with " | ", the current view is plain
# text instead of a link, and the remotes view is included only when the
# 'remote_heads' feature is enabled.
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @entries;
        foreach my $view (@ref_views) {
                if ($view eq $current) {
                        push @entries, $view;
                } else {
                        push @entries, $cgi->a({-href => href(action=>$view)}, $view);
                }
        }
        return join(" | ", @entries);
}
4100
# Returns the "first . prev . next" paging line for page number $page.
# "first" and "prev" are links only when $page > 0, "next" only when
# $has_next_link is true.  The links replay the current request with a
# different page number.  $action is accepted but not used here.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my $backwards = "first &sdot; prev";
        if ($page > 0) {
                $backwards =
                        $cgi->a({-href => href(-replay=>1, page=>undef)}, "first") .
                        " &sdot; " .
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        }

        my $forwards = "next";
        if ($has_next_link) {
                $forwards =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return $backwards . " &sdot; " . $forwards;
}
4126
4127 ## ......................................................................
4128 ## functions printing or outputting HTML: div
4129
# Print a <div class="header"> holding a single link to the given action.
# $hash and $hash_base are added to the link only when true; the link text
# is $title, or $action when $title is false.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        if ($hash) {
                $args{'hash'} = $hash;
        }
        if ($hash_base) {
                $args{'hash_base'} = $hash_base;
        }

        my $label = $title || $action;
        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
4143
# Returns one "metadata_url" table row with $name in the first cell and
# $url in the second.  Both values are inserted as given, without escaping.
sub format_repo_url {
        my ($name, $url) = @_;
        return '<tr class="metadata_url">' .
               "<td>$name</td>" .
               "<td>$url</td>" .
               "</tr>\n";
}
4148
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, an IO handle passed either as *handle,
# \*handle or *handle{IO}, or a function reference. In the latter case all
# following parameters will be taken as argument to the content function call.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        my $kind = ref($content);
        # A bare glob (*handle) is not a reference, so it has to be detected
        # through a reference to the scalar that holds it.  *handle{IO} is
        # blessed into IO::File on perl 5.12 and later (IO::Handle or
        # FileHandle before that), so the class name alone is not enough.
        my $is_handle = $kind eq 'GLOB'
                     || ref(\$content) eq 'GLOB'
                     || $kind eq 'IO::Handle'
                     || $kind eq 'IO::File'
                     || $kind eq 'FileHandle'
                     || UNIVERSAL::isa($content, 'IO::Handle');

        if ($kind eq 'CODE') {
                $content->(@_);
        } elsif ($kind eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                print <$content>;
        } elsif (!$kind && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4186
# Returns HTML for a timestamp: the 'rfc2822' string of the date hash
# reference (wrapped in a <span> when the 'javascript-timezone' feature
# provides a class name as its third value), followed by the local time and
# timezone in parentheses.  Local hours below 6 are marked up with the
# "atnight" class.
sub format_timestamp_html {
        my $date = shift;
        my ($hour, $minute, $tz) = @{$date}{qw(hour_local minute_local tz_local)};

        my $strtime = $date->{'rfc2822'};
        my (undef, undef, $datetime_class) =
                gitweb_get_feature('javascript-timezone');
        $strtime = qq!<span class="$datetime_class">$strtime</span>!
                if $datetime_class;

        my $localtime_format = ($hour < 6)
                ? '(<span class="atnight">%02d:%02d</span> %s)'
                : '(%02d:%02d %s)';

        return $strtime . ' ' . sprintf($localtime_format, $hour, $minute, $tz);
}
4207
# Outputs the author name and date in long form, wrapped in an element of
# class "author_date".  The element is a <div> unless the -tag option names
# another tag.
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $who    = format_search_author($author, "author", esc_html($author));
        my $when   = format_timestamp_html(\%ad);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $who .
              " [" . $when . "]" .
              $avatar .
              "</$tag>\n";
}
4222
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for. If the list is empty it defaults to both
# author and committer.
# Each person takes two rows: name, e-mail and avatar on the first, the
# timestamp on the second.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') if !@people;

        foreach my $who (@people) {
                my $name  = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $identity =
                        format_search_author($name, $who, esc_html($name)) . " " .
                        format_search_author($email, $who, esc_html("<" . $email . ">"));
                my $avatar = git_get_avatar($email, -size => 'double');
                my $when = format_timestamp_html(\%wd);

                print "<tr><td>$who</td><td>" .
                      $identity .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" .
                      $when .
                      "</td>" .
                      "</tr>\n";
        }
}
4250
# Print the "page_path" line: a link to the tree root followed by one link
# per leading directory of $name and finally the last path component.
#
# $name - path of the object shown (may be undef: only the root is printed)
# $type - 'blob' links the last component to the blob_plain view, 'tree'
#         links it to the tree view; anything else prints it as plain text
# $hb   - hash base used for every link
#
# NOTE(review): the link for the last component uses the global $file_name
# rather than $name; presumably callers always pass $file_name as $name.
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;


        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth value: a leading
                        # directory named "0" must still get its separator
                        $fullname .= (length($fullname) ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$file_name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$file_name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4288
# Print a commit message, given as a reference to an array of lines, as
# HTML with one <br/> per line.
#
# Options:
#   -remove_title     drop the first line of the log
#   -remove_signoff   drop sign-off style lines (Signed-off-by, Acked-by,
#                     Cc) instead of printing them in a "signoff" span
#   -final_empty_line end the output with an empty line unless the last
#                     printed line already was one
#
# Runs of empty lines are collapsed into one, and empty lines that follow
# a sign-off line are not printed.
# Note that leading lines are shift()ed off the caller's array.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0;  # true while only empty lines followed a signoff
        my $empty = 0;    # true when the last printed line was empty
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $signoff = 1;
                        $empty = 0;
                        if (! $opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                        }
                        # signoff lines are either printed above or removed
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        # Only real text ends the "after signoff" state.
                        # Clearing it for every non-signoff line would make
                        # the check above ineffective for the empty line
                        # directly after a signoff.
                        $signoff = 0;
                        $empty = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4337
# Return link target (what link points to): the whole content of the blob
# $hash as printed by "cat-file blob".  Returns nothing when the command
# cannot be started or when closing the pipe fails.
sub git_get_link_target {
        my $hash = shift;

        # read link
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;
        # slurp everything in one read
        my $link_target = do { local $/ = undef; <$fd> };
        close $fd
                or return;

        return $link_target;
}
4355
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
# An undefined or empty basedir means the link lives in the top tree.
# Empty and '.' components are dropped and '..' removes the preceding
# component; a '..' that would climb above the top tree makes the link
# impossible to normalize.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir)
        my $path;
        if (defined $basedir && $basedir ne '') {
                $path = $basedir . '/' . $link_target;
        } else {
                # we are in top (root) tree (dir)
                $path = $link_target;
        }

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and ''; compare strings rather than testing
                # truth, so that a component named "0" is kept
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        if (@path_parts) {
                                pop @path_parts;
                        } else {
                                # link leads outside repository (outside top dir)
                                return;
                        }
                } else {
                        push @path_parts, $part;
                }
        }
        $path = join('/', @path_parts);

        return $path;
}
4395
# print tree entry (row of git_tree), but without encompassing <tr> element
#
# $t          - hash reference for the entry; the keys read here are
#               'mode', 'type', 'hash', 'name' and (optionally) 'size'
# $basedir    - prefix put directly in front of the entry name to build
#               the file_name of the links
# $hash_base  - when defined, passed on in the links and enables the
#               "history" links
# $have_blame - when true, blob entries get a "blame" link
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my %base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();
        my $type = $t->{'type'};

        # The format of a table row is: mode list link.  Where mode is
        # the mode of the entry, list is the name of the entry, an href,
        # and link is the action links of the entry.

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if exists $t->{'size'};

        if ($type eq "blob") {
                my $path = "$basedir$t->{'name'}";
                my @blob_args = (hash=>$t->{'hash'}, file_name=>$path, %base_key);

                my $list_cell =
                        $cgi->a({-href => href(action=>"blob", @blob_args),
                                -class => "list"}, esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        # symbolic link: also show where it points to
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                if (defined $norm_target) {
                                        $list_cell .= " -> " .
                                              $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                     file_name=>$norm_target),
                                                       -title => $norm_target}, esc_path($link_target));
                                } else {
                                        $list_cell .= " -> " . esc_path($link_target);
                                }
                        }
                }
                print "<td class=\"list\">" . $list_cell . "</td>\n";

                my @links = (
                        $cgi->a({-href => href(action=>"blob", @blob_args)}, "blob"),
                );
                if ($have_blame) {
                        push @links,
                              $cgi->a({-href => href(action=>"blame", @blob_args)}, "blame");
                }
                if (defined $hash_base) {
                        push @links,
                              $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                     hash=>$t->{'hash'}, file_name=>$path)},
                                      "history");
                }
                push @links,
                        $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                               file_name=>$path)},
                                "raw");
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } elsif ($type eq "tree") {
                my $path = "$basedir$t->{'name'}";
                my @tree_args = (action=>"tree", hash=>$t->{'hash'},
                                 file_name=>$path, %base_key);

                print "<td class=\"list\">" .
                      $cgi->a({-href => href(@tree_args)}, esc_path($t->{'name'})) .
                      "</td>\n";

                my @links = ($cgi->a({-href => href(@tree_args)}, "tree"));
                if (defined $hash_base) {
                        push @links,
                              $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                     file_name=>$path)},
                                      "history");
                }
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";
        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" .
                      esc_path($t->{'name'}) .
                      "</td>\n";

                my $history = '';
                if (defined $hash_base) {
                        $history = $cgi->a({-href => href(action=>"history",
                                                          hash_base=>$hash_base,
                                                          file_name=>"$basedir$t->{'name'}")},
                                           "history");
                }
                print "<td class=\"link\">" . $history . "</td>\n";
        }
}
4488
4489 ## ......................................................................
4490 ## functions printing large fragments of HTML
4491
# Fill in pre-image (source) filenames for a merge (combined) diff entry.
#
# $diff    - hashref of a parsed combined raw diff line; this reads its
#            'nparents', 'status' (arrayref) and 'from_id' (arrayref) fields
# @parents - parent commit ids, indexed like the per-parent arrays above
#
# Stores an array with one slot per parent in $diff->{'from_file'}.  A slot
# is looked up via git_get_path_by_hash() only when the status against that
# parent is 'R' (rename) or 'C' (copy); every other slot is left undef.
# Returns $diff itself.
sub fill_from_file_info {
	my ($diff, @parents) = @_;

	my $from_files = $diff->{'from_file'} = [ ];
	# touch the last slot so the array has one entry for each parent
	$from_files->[$diff->{'nparents'} - 1] = undef;

	foreach my $n (0 .. $diff->{'nparents'} - 1) {
		my $status = $diff->{'status'}[$n];
		next unless ($status eq 'R' || $status eq 'C');

		$from_files->[$n] =
			git_get_path_by_hash($parents[$n], $diff->{'from_id'}[$n]);
	}

	return $diff;
}
4508
# Tell whether a parsed raw difftree line describes a file deletion.
#
# $diffinfo - hashref of parsed raw diff format; only 'to_id' is read
#
# A deletion is marked by an all-zero post-image object id.  The null id is
# 40 hex digits long in SHA-1 repositories and 64 in SHA-256 ones, so both
# lengths are accepted.  Returns 1 for a deletion, '' otherwise.
sub is_deleted {
	my $diffinfo = shift;

	return $diffinfo->{'to_id'} =~ m/\A(?:0{40}|0{64})\z/ ? 1 : '';
}
4515
# Tell whether a patch belongs to the same raw difftree line as the one
# already being processed, i.e. whether the patch is a continuation of a
# split patch.
#
# $diffinfo  - hashref of parsed raw diff format (may be undef)
# $patchinfo - hashref of parsed patch diff format, using the same keys
#              as $diffinfo (may be undef)
#
# True only if both arguments are defined and name the same 'to_file'.
sub is_patch_split {
	my ($diffinfo, $patchinfo) = @_;

	my $both_given = defined($diffinfo) && defined($patchinfo);
	return $both_given
		&& $patchinfo->{'to_file'} eq $diffinfo->{'to_file'};
}
4526
4527
# Print the "difftree" table: one row per changed file, giving its status
# and links to the related views.
#
# $difftree - arrayref of raw diff lines; each element is passed through
#             parsed_difftree_line() before use
# $hash     - id of the commit whose changes are listed
# @parents  - parent commit ids; more than one selects the combined (merge)
#             diff layout, and the first one is used as the "from" side of
#             ordinary diffs
#
# Reads the globals $action and $cgi.  In 'commitdiff' view every row gets
# a link to the "patchN" anchor, with patches numbered from 1 in row order.
# The 'blame' links are printed only when that feature is enabled.
sub git_difftree_body {
	my ($difftree, $hash, @parents) = @_;
	my ($parent) = $parents[0];
	my $have_blame = gitweb_check_feature('blame');
	print "<div class=\"list_head\">\n";
	if ($#{$difftree} > 10) {
		print(($#{$difftree} + 1) . " files changed:\n");
	}
	print "</div>\n";

	print "<table class=\"" .
	      (@parents > 1 ? "combined " : "") .
	      "diff_tree\">\n";

	# header only for combined diff in 'commitdiff' view
	my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
	if ($has_header) {
		# table header
		print "<thead><tr>\n" .
		       "<th></th><th></th>\n"; # filename, patchN link
		for (my $i = 0; $i < @parents; $i++) {
			my $par = $parents[$i];
			print "<th>" .
			      $cgi->a({-href => href(action=>"commitdiff",
			                             hash=>$hash, hash_parent=>$par),
			               -title => 'commitdiff to parent number ' .
			                          ($i+1) . ': ' . substr($par,0,7)},
			              $i+1) .
			      "&nbsp;</th>\n";
		}
		print "</tr></thead>\n<tbody>\n";
	}

	my $alternate = 1;   # toggles between "dark" and "light" rows
	my $patchno = 0;     # number of the patch the current row links to
	foreach my $line (@{$difftree}) {
		my $diff = parsed_difftree_line($line);

		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;

		if (exists $diff->{'nparents'}) { # combined diff

			fill_from_file_info($diff, @parents)
				unless exists $diff->{'from_file'};

			if (!is_deleted($diff)) {
				# file exists in the result (child) commit
				print "<td>" .
				      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash),
				              -class => "list"}, esc_path($diff->{'to_file'})) .
				      "</td>\n";
			} else {
				print "<td>" .
				      esc_path($diff->{'to_file'}) .
				      "</td>\n";
			}

			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print "<td class=\"link\">" .
				      $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | " .
				      "</td>\n";
			}

			# one cell per parent; meanwhile note whether the file has
			# any history and whether it survives in the result
			my $has_history = 0;
			my $not_deleted = 0;
			for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
				my $hash_parent = $parents[$i];
				my $from_hash = $diff->{'from_id'}[$i];
				my $from_path = $diff->{'from_file'}[$i];
				my $status = $diff->{'status'}[$i];

				$has_history ||= ($status ne 'A');
				$not_deleted ||= ($status ne 'D');

				if ($status eq 'A') {
					print "<td  class=\"link\" align=\"right\"> | </td>\n";
				} elsif ($status eq 'D') {
					print "<td class=\"link\">" .
					      $cgi->a({-href => href(action=>"blob",
					                             hash_base=>$hash,
					                             hash=>$from_hash,
					                             file_name=>$from_path)},
					              "blob" . ($i+1)) .
					      " | </td>\n";
				} else {
					if ($diff->{'to_id'} eq $from_hash) {
						print "<td class=\"link nochange\">";
					} else {
						print "<td class=\"link\">";
					}
					print $cgi->a({-href => href(action=>"blobdiff",
					                             hash=>$diff->{'to_id'},
					                             hash_parent=>$from_hash,
					                             hash_base=>$hash,
					                             hash_parent_base=>$hash_parent,
					                             file_name=>$diff->{'to_file'},
					                             file_parent=>$from_path)},
					              "diff" . ($i+1)) .
					      " | </td>\n";
				}
			}

			print "<td class=\"link\">";
			if ($not_deleted) {
				print $cgi->a({-href => href(action=>"blob",
				                             hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "blob");
				print " | " if ($has_history);
			}
			if ($has_history) {
				print $cgi->a({-href => href(action=>"history",
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "history");
			}
			print "</td>\n";

			print "</tr>\n";
			next; # instead of 'else' clause, to avoid extra indent
		}
		# else ordinary diff

		# an all-zero mode means that side of the diff does not exist
		my ($to_mode_oct, $to_mode_str, $to_file_type);
		my ($from_mode_oct, $from_mode_str, $from_file_type);
		if ($diff->{'to_mode'} ne ('0' x 6)) {
			$to_mode_oct = oct $diff->{'to_mode'};
			if (S_ISREG($to_mode_oct)) { # only for regular file
				$to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
			}
			$to_file_type = file_type($diff->{'to_mode'});
		}
		if ($diff->{'from_mode'} ne ('0' x 6)) {
			$from_mode_oct = oct $diff->{'from_mode'};
			if (S_ISREG($from_mode_oct)) { # only for regular file
				$from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
			}
			$from_file_type = file_type($diff->{'from_mode'});
		}

		if ($diff->{'status'} eq "A") { # created
			my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
			$mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
			$mode_chng   .= "]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			              "blob");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "D") { # deleted
			# the file exists only in the parent, so all links use $parent
			my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'}),
			               -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
			my $mode_chnge = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				$mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
				if ($from_file_type ne $to_file_type) {
					$mode_chnge .= " from $from_file_type to $to_file_type";
				}
				if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
					if ($from_mode_str && $to_mode_str) {
						$mode_chnge .= " mode: $from_mode_str->$to_mode_str";
					} elsif ($to_mode_str) {
						$mode_chnge .= " mode: $to_mode_str";
					}
				}
				$mode_chnge .= "]</span>\n";
			}
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chnge</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only mode changed)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "diff") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			               "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
			my %status_name = ('R' => 'moved', 'C' => 'copied');
			my $nstatus = $status_name{$diff->{'status'}};
			my $mode_chng = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				# mode also for directories, so we cannot use $to_mode_str
				$mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
			}
			print "<td>" .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
			                             hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
			              -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
			      "<td><span class=\"file_status $nstatus\">[$nstatus from " .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
			                             hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
			              -class => "list"}, esc_path($diff->{'from_file'})) .
			      " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
			      "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only pure rename or copy)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
				              "diff") .
				      " | ";
			}
			# the post-image path exists in $hash, not in $parent, so $hash
			# is the base here, as for the filename link above
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'to_file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'to_file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                            file_name=>$diff->{'to_file'})},
			              "history");
			print "</td>\n";

		} # we should not encounter Unmerged (U) or Unknown (X) status
		print "</tr>\n";
	}
	print "</tbody>" if $has_header;
	print "</table>\n";
}
4835
# Print a patchset, read line by line from $fd, as HTML.
#
# $fd           - filehandle the textual "git diff" output is read from
# $difftree     - arrayref of raw diff lines for the same change; patches
#                 are matched against it to derive the "patchN" anchors
# $hash         - commit id; accepted but not used inside this function
# @hash_parents - parent commit ids; more than one means a combined diff
#
# Every raw difftree line gets a <div class="patch" id="patchN"> (N counted
# from 1); further patches for the same file get class "patch cont".  For
# combined diffs, raw lines with no patch of their own are rendered with
# format_diff_cc_simplified().  If nothing at all was printed, a "Trivial
# merge" / "No differences found" notice is shown instead.
sub git_patchset_body {
	my ($fd, $difftree, $hash, @hash_parents) = @_;

	my $is_combined = (@hash_parents > 1);
	my $raw_idx = 0;        # index into @$difftree of the current raw line
	my $patches_seen = 0;   # patches printed so far, real or simplified
	my ($line, $raw, $to_path);
	my (%from, %to);

	print "<div class=\"patchset\">\n";

	# discard everything that precedes the first "diff " header
	while ($line = <$fd>) {
		chomp $line;

		last if ($line =~ m/^diff /);
	}

 PATCH:
	while ($line) {

		# pull the post-image name out of the "git diff" header line;
		# it stays undef when the header has an unexpected form
		$to_path = undef;
		if ($line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
			# first capture is the pre-image name, which is not needed
			$to_path = unquote($2);
			$to_path =~ s!^b/!!;
		} elsif ($line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
			# first capture is 'cc' or 'combined', which is not needed
			$to_path = unquote($2);
		}

		# decide whether this patch still belongs to the current raw line
		if (is_patch_split($raw, { 'to_file' => $to_path })) {
			# continuation of a split patch
			print "<div class=\"patch cont\">\n";
		} else {
			# move on to the next raw line, except for the very first patch
			$raw_idx++ if defined $raw;

			$raw = parsed_difftree_line($difftree->[$raw_idx]);

			# compact combined diff output may skip some patches; emit
			# placeholders until the raw line for this pathname is reached
			if ($is_combined) {
				while ($to_path ne $raw->{'to_file'}) {
					print "<div class=\"patch\" id=\"patch". ($raw_idx+1) ."\">\n" .
					      format_diff_cc_simplified($raw, @hash_parents) .
					      "</div>\n";  # class="patch"

					$raw_idx++;
					$patches_seen++;

					last if $raw_idx > $#$difftree;
					$raw = parsed_difftree_line($difftree->[$raw_idx]);
				}
			}

			# refreshes the %from and %to hashes
			parse_from_to_diffinfo($raw, \%from, \%to, @hash_parents);

			# first patch for this raw line; @$difftree is indexed from 0
			# while patch anchors are numbered from 1
			print "<div class=\"patch\" id=\"patch". ($raw_idx+1) ."\">\n";
		}

		# "git diff" header; $line is already chomp-ed at this point
		$patches_seen++;
		print format_git_diff_header_line($line, $raw,
		                                  \%from, \%to);

		# extended diff header, up to the "--- " line or the next patch
		print "<div class=\"diff extended_header\">\n";
	EXTENDED_HEADER:
		while ($line = <$fd>) {
			chomp $line;

			last EXTENDED_HEADER if ($line =~ m/^--- |^diff /);

			print format_extended_diff_header_line($line, $raw,
			                                       \%from, \%to);
		}
		print "</div>\n"; # class="diff extended_header"

		# input ended inside the header: close the patch by hand, because
		# leaving via 'last' bypasses the continue block
		unless ($line) {
			print "</div>\n"; # class="patch"
			last PATCH;
		}
		# header-only patch, the next one starts right away
		next PATCH if ($line =~ m/^diff /);

		# from-file/to-file header: current line is "---", next is "+++"
		my $from_header = $line;
		$line = <$fd>;
		chomp $line;

		print format_diff_from_to_header($from_header, $line,
		                                 $raw, \%from, \%to,
		                                 @hash_parents);

		# the patch itself
	LINE:
		while ($line = <$fd>) {
			chomp $line;

			next PATCH if ($line =~ m/^diff /);

			print format_diff_line($line, \%from, \%to);
		}

	} continue {
		print "</div>\n"; # class="patch"
	}

	# with compact combined (--cc) format the patchset may be empty or
	# short while raw lines are still pending; give each one an anchor
	# for the "patch" links of the difftree part
	$raw_idx++ if $patches_seen > 0;
	while ($raw_idx < @$difftree) {
		$raw = parsed_difftree_line($difftree->[$raw_idx]);

		print "<div class=\"patch\" id=\"patch". ($raw_idx+1) ."\">\n" .
		      format_diff_cc_simplified($raw, @hash_parents) .
		      "</div>\n";  # class="patch"

		$patches_seen++;
		$raw_idx++;
	}

	unless ($patches_seen) {
		print $is_combined
			? "<div class=\"diff nodifferences\">Trivial merge</div>\n"
			: "<div class=\"diff nodifferences\">No differences found</div>\n";
	}

	print "</div>\n"; # class="patchset"
}
4986
4987 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
4988
# Fill in per-project information (age, description, owner and, when the
# corresponding options are enabled, ctags and category) for every project
# in the list.
#
# $projlist - arrayref of project hashrefs, each with at least 'path'
#
# Returns the list of projects for which git_get_last_activity() reported
# something; the others are left out of the result.
# NOTE: the hashrefs in $projlist are modified in place, but no entry is
# removed from $projlist itself.
sub fill_project_list_info {
	my $projlist = shift;
	my @filled;

	my $show_ctags = gitweb_check_feature('ctags');
	foreach my $proj (@$projlist) {
		my $path = $proj->{'path'};

		# no activity information: leave this project out of the result
		my @activity = git_get_last_activity($path);
		next unless @activity;
		@{$proj}{'age', 'age_string'} = @activity;

		# values already present in the entry are kept as they are
		unless (defined $proj->{'descr'}) {
			my $long = to_utf8(git_get_project_description($path) || "");
			$proj->{'descr_long'} = $long;
			$proj->{'descr'} = chop_str($long, $projects_list_description_width, 5);
		}
		unless (defined $proj->{'owner'}) {
			$proj->{'owner'} = git_get_project_owner("$path") || "";
		}
		if ($show_ctags) {
			$proj->{'ctags'} = git_get_project_ctags($path);
		}
		if ($projects_list_group_categories && !defined $proj->{'category'}) {
			$proj->{'category'} = to_utf8(git_get_project_category($path) ||
			                              $project_list_default_category);
		}

		push @filled, $proj;
	}

	return @filled;
}
5028
# Return the projects of @$projlist sorted according to $order.
#
# $projlist - arrayref of project hashrefs
# $order    - one of 'project', 'descr', 'owner' (compared as strings on
#             the 'path', 'descr_long' and 'owner' fields respectively) or
#             'age' (compared numerically on 'age')
#
# For any other $order the list is returned in its original order.
# $projlist itself is not modified.
sub sort_projects_list {
	my ($projlist, $order) = @_;

	# order name => [ field to compare, comparison type ]
	my %sort_spec = (
		project => [ 'path',       'str' ],
		descr   => [ 'descr_long', 'str' ],
		owner   => [ 'owner',      'str' ],
		age     => [ 'age',        'num' ],
	);
	my $spec = $sort_spec{$order};
	return @$projlist unless defined $spec;

	my ($field, $type) = @$spec;
	my $compare = ($type eq 'str')
		? sub { $_[0]->{$field} cmp $_[1]->{$field} }
		: sub { $_[0]->{$field} <=> $_[1]->{$field} };

	my @sorted = sort { $compare->($a, $b) } @$projlist;
	return @sorted;
}
5049
# Group projects by their 'category' field.
#
# $projlist - arrayref of project hashrefs
# $from     - index of the first project to include (defaults to 0)
# $to       - index of the last project to include (defaults to, and is
#             capped at, the last index of @$projlist)
#
# Returns a hash mapping category name to an arrayref of the projects in
# that category, in list order; in scalar context a reference to that hash
# is returned instead.
sub build_projlist_by_category {
	my ($projlist, $from, $to) = @_;
	my %categories;

	my $first = defined $from ? $from : 0;
	my $last = $#$projlist;
	$last = $to if (defined $to && $to <= $#$projlist);

	foreach my $idx ($first .. $last) {
		my $pr = $projlist->[$idx];
		push @{$categories{ $pr->{'category'} }}, $pr;
	}

	return \%categories unless wantarray;
	return %categories;
}
5066
# Print a 'sort by' <th> element; the markup comes from format_sort_th(),
# which turns the heading into a 'sort by $name' replay link unless that
# order is already the selected one.  Takes the same arguments as
# format_sort_th().
sub print_sort_th {
	my @th_args = @_;

	print format_sort_th(@th_args);
}
5072
# Build the <th> element for one sortable column and return it as a string.
#
# $name   - name of the order this column sorts by
# $order  - order currently in effect
# $header - column caption; defaults to ucfirst($name) when false
#
# The column matching the current order is plain text; any other column
# becomes a link replaying the current request with order=$name.
sub format_sort_th {
	my ($name, $order, $header) = @_;
	$header ||= ucfirst($name);

	# already sorted by this column: no link needed
	return "<th>$header</th>\n" if ($order eq $name);

	my $link = $cgi->a({-href => href(-replay=>1, order=>$name),
	                    -class => "header"}, $header);
	return "<th>" . $link . "</th>\n";
}
5089
# Print one <tr> per project for the entries $from..$to of @$projlist.
#
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# When $check_forks is true each row starts with an extra cell that holds
# a "+" marker for projects carrying a 'forks' list.  The remaining cells
# are: project path, description, owner, age, and the action links.
sub git_project_list_rows {
	my ($projlist, $from, $to, $check_forks) = @_;
	my $last = $#$projlist;

	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	my $alternate = 1;
	foreach my $idx ($from .. $to) {
		my $pr = $projlist->[$idx];
		my $path = $pr->{'path'};

		# rows alternate between the "dark" and "light" classes
		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		if ($check_forks) {
			print "<td>";
			if ($pr->{'forks'}) {
				my $nforks = scalar @{$pr->{'forks'}};
				my $marker;
				if ($nforks > 0) {
					# link to the forks view only if there is something to show
					$marker = $cgi->a({-href => href(project=>$path, action=>"forks"),
					                   -title => "$nforks forks"}, "+");
				} else {
					$marker = $cgi->span({-title => "$nforks forks"}, "+");
				}
				print $marker;
			}
			print "</td>\n";
		}

		# path, description and owner cells
		my $name_link = $cgi->a({-href => href(project=>$path, action=>"summary"),
		                         -class => "list"}, esc_html($path));
		my $descr_link = $cgi->a({-href => href(project=>$path, action=>"summary"),
		                          -class => "list", -title => $pr->{'descr_long'}},
		                         esc_html($pr->{'descr'}));
		my $owner = chop_and_escape_str($pr->{'owner'}, 15);
		print "<td>" . $name_link . "</td>\n" .
		      "<td>" . $descr_link . "</td>\n" .
		      "<td><i>" . $owner . "</i></td>\n";

		# age cell followed by the per-project action links
		my $age_class = age_class($pr->{'age'});
		my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";

		my @actions = ("summary", "shortlog", "log", "tree");
		push @actions, "forks" if $pr->{'forks'};
		my @links;
		foreach my $action (@actions) {
			my $link = $cgi->a({-href => href(project=>$path, action=>$action)}, $action);
			push @links, $link;
		}

		print "<td class=\"" . $age_class . "\">" . $age_text . "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
}
5138
# Print the projects table: an optional tag cloud, a header row with
# sort links, one row per project (optionally grouped by category) and an
# optional trailing row.
#
# $projlist  - reference to the list of project hashes
# $order     - sort column; falls back to $default_projects_order
# $from, $to - window of the filtered, sorted list to display; defaults
#              to the whole list
# $extra     - HTML placed in a final row spanning the table, if defined
# $no_header - true to leave out the header row
#
# Prints a "No such projects found" notice instead of a table when the
# window is empty.  Reads the globals $cgi, $searchtext,
# $default_projects_order and $projects_list_group_categories.
sub git_project_list_body {
	# actually uses global variable $project
	my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
	my @projects = @$projlist;

	my $check_forks = gitweb_check_feature('forks');
	my $show_ctags  = gitweb_check_feature('ctags');
	my $tagfilter = $show_ctags ? $cgi->param('by_tag') : undef;
	# fork markers are not shown for search / tag-filtered listings
	$check_forks = undef
		if ($tagfilter || $searchtext);

	# filtering out forks before filling info allows to do less work
	@projects = filter_forks_from_projects_list(\@projects)
		if ($check_forks);
	@projects = fill_project_list_info(\@projects);
	# searching projects require filling to be run before it
	@projects = search_projects_list(\@projects,
	                                 'searchtext' => $searchtext,
	                                 'tagfilter'  => $tagfilter)
		if ($tagfilter || $searchtext);

	$order ||= $default_projects_order;
	$from = 0 unless defined $from;
	$to = $#projects if (!defined $to || $#projects < $to);

	# short circuit
	if ($from > $to) {
		print "<center>\n".
		      "<b>No such projects found</b><br />\n".
		      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
		      "</center>\n<br />\n";
		return;
	}

	@projects = sort_projects_list(\@projects, $order);

	if ($show_ctags) {
		my $ctags = git_gather_all_ctags(\@projects);
		my $cloud = git_populate_project_tagcloud($ctags);
		print git_show_project_tagcloud($cloud, 64);
	}

	print "<table class=\"project_list\">\n";
	unless ($no_header) {
		print "<tr>\n";
		if ($check_forks) {
			print "<th></th>\n";
		}
		print_sort_th('project', $order, 'Project');
		print_sort_th('descr', $order, 'Description');
		print_sort_th('owner', $order, 'Owner');
		print_sort_th('age', $order, 'Last Change');
		print "<th></th>\n" . # for links
		      "</tr>\n";
	}

	if ($projects_list_group_categories) {
		# only display categories with projects in the $from-$to window
		@projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
		# @projects now holds just the window, re-indexed from 0, so group
		# all of it; applying $from..$to a second time would drop the
		# first $from projects of the window
		my %categories = build_projlist_by_category(\@projects);
		foreach my $cat (sort keys %categories) {
			# projects in the "" category are listed without a heading row
			unless ($cat eq "") {
				print "<tr>\n";
				if ($check_forks) {
					print "<td></td>\n";
				}
				print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
				print "</tr>\n";
			}

			git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
		}
	} else {
		git_project_list_rows(\@projects, $from, $to, $check_forks);
	}

	if (defined $extra) {
		print "<tr>\n";
		if ($check_forks) {
			print "<td></td>\n";
		}
		print "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5225
# Print the body of the 'log' view: for every commit in the $from..$to
# window a header div, the commit / commitdiff / tree links, the
# authorship line and the commit message.
#
# $commitlist - reference to a list of parsed-commit hashes
# $from, $to  - window to print; $from defaults to 0, $to defaults to
#               (and is capped at) the last index
# $refs       - passed to format_ref_marker() for each commit
# $extra      - HTML printed in a trailing "page_nav" div, if true
sub git_log_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	# honour $from like git_shortlog_body() and git_history_body() do;
	# the loop used to start at 0 regardless of the requested window
	for (my $i = $from; $i <= $to; $i++) {
		my %co = %{$commitlist->[$i]};
		next if !%co;
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);
		git_print_header_div('commit',
		               "<span class=\"age\">$co{'age_string'}</span>" .
		               esc_html($co{'title'}) . $ref,
		               $commit);
		print "<div class=\"title_text\">\n" .
		      "<div class=\"log_link\">\n" .
		      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
		      "<br/>\n" .
		      "</div>\n";
		git_print_authorship(\%co, -tag => 'span');
		print "<br/>\n</div>\n";

		print "<div class=\"log_body\">\n";
		git_print_log($co{'comment'}, -final_empty_line=> 1);
		print "</div>\n";
	}
	if ($extra) {
		print "<div class=\"page_nav\">\n";
		print "$extra\n";
		print "</div>\n";
	}
}
5264
# Print the 'shortlog' table: one row per commit in the $from..$to window
# with date, author, subject and the commit / commitdiff / tree links,
# plus snapshot links when format_snapshot_links() returns any.
#
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# A defined $extra is printed in a final row spanning four columns.
sub git_shortlog_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;
	my $last = $#{$commitlist};

	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	print "<table class=\"shortlog\">\n";
	my $alternate = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		# rows alternate between the "dark" and "light" classes
		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		# git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 10) . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
		my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      join(" | ", $commit_link, $diff_link, $tree_link);

		my $snapshot_links = format_snapshot_links($commit);
		print " | " . $snapshot_links if (defined $snapshot_links);

		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5308
# Print the 'history' table for one path: a row per commit in the
# $from..$to window with date, author, subject, a link to the path at
# that commit, a commitdiff link and, for blobs whose content differs
# from $file_hash, a "diff to current" link.
#
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# $ftype is used both as the action and as the text of the first link.
# A defined $extra is printed in a final row spanning four columns.
# Also reads the global $hash_base.
sub git_history_body {
	# Warning: assumes constant type (blob or tree) during history
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;
	my $last = $#{$commitlist};

	$from = 0 unless defined $from;
	$to = $last if (!defined $to || $last < $to);

	print "<table class=\"history\">\n";
	my $alternate = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		# empty entries produce no row
		next unless %co;

		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		# shortlog uses format_author_html('td', \%co, 10)
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 15, 3) . "<td>";
		# originally git_history used chop_str($co{'title'}, 50)
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $path_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
		my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $path_link . " | " . $diff_link;

		if ($ftype eq 'blob') {
			my $blob_current = $file_hash;
			my $blob_parent  = git_get_hash_by_path($commit, $file_name);
			my $differs = defined $blob_current && defined $blob_parent &&
			              $blob_current ne $blob_parent;
			if ($differs) {
				print " | " .
					$cgi->a({-href => href(action=>"blobdiff",
					                       hash=>$blob_current, hash_parent=>$blob_parent,
					                       hash_base=>$hash_base, hash_parent_base=>$commit,
					                       file_name=>$file_name)},
					        "diff to current");
			}
		}
		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5368
# Print the 'tags' table: one row per entry in the $from..$to window of
# @$taglist with age, name, subject (if any), a "tag" self-link for
# entries of type "tag", and links that depend on the referenced type.
#
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# A defined $extra is printed in a final row spanning five columns.
sub git_tags_body {
	# uses global variable $project
	my ($taglist, $from, $to, $extra) = @_;
	my $last = $#{$taglist};

	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	print "<table class=\"tags\">\n";
	my $alternate = 1;
	foreach my $idx ($from .. $to) {
		my $entry = $taglist->[$idx];
		my %tag = %$entry;
		my $reftype = $tag{'reftype'};

		my $comment = $tag{'subject'};
		my $comment_short;
		$comment_short = chop_str($comment, 30, 5) if (defined $comment);

		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		# age cell stays empty when the entry has no age
		print defined $tag{'age'} ? "<td><i>$tag{'age'}</i></td>\n" : "<td></td>\n";

		my $name_link = $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'}),
		                         -class => "list name"}, esc_html($tag{'name'}));
		print "<td>" .
		      $name_link .
		      "</td>\n" .
		      "<td>";
		if (defined $comment) {
			print format_subject_html($comment, $comment_short,
			                          href(action=>"tag", hash=>$tag{'id'}));
		}
		print "</td>\n" .
		      "<td class=\"selflink\">";
		if ($tag{'type'} eq "tag") {
			print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
		} else {
			print "&nbsp;";
		}

		my $target_link = $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'})}, $reftype);
		print "</td>\n" .
		      "<td class=\"link\">" . " | " .
		      $target_link;
		if ($reftype eq "commit") {
			my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
			my $log_link = $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
			print " | " . $shortlog_link .
			      " | " . $log_link;
		} elsif ($reftype eq "blob") {
			print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}
		print "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5431
# Print the 'heads' table: one row per entry in the $from..$to window of
# @$headlist with age, name and the shortlog / log / tree links.
#
# $head  - id of the current head; the row whose 'id' equals it gets the
#          "current_head" class.  May be undefined, in which case no row
#          is marked.
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# A defined $extra is printed in a final row spanning three columns.
sub git_heads_body {
	# uses global variable $project
	my ($headlist, $head, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	$to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

	print "<table class=\"heads\">\n";
	my $alternate = 1;
	for (my $i = $from; $i <= $to; $i++) {
		my $entry = $headlist->[$i];
		my %ref = %$entry;
		# guard against an undefined $head, which would otherwise trigger
		# an "uninitialized value" warning on every row
		my $curr = defined $head && $ref{'id'} eq $head;
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td><i>$ref{'age'}</i></td>\n" .
		      ($curr ? "<td class=\"current_head\">" : "<td>") .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
		               -class => "list name"},esc_html($ref{'name'})) .
		      "</td>\n" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
		      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
		      "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5469
# Display a single remote block: a small table with the remote's URL(s)
# followed by its heads.
#
# $remote - remote name, used for the "..." link to the 'remotes' view
# $rdata  - hash reference with the keys 'heads', 'fetch' and 'push'
# $limit  - maximum number of heads to list; when defined and smaller
#           than the number of heads, a "..." link is added
# $head   - passed on to git_heads_body() as the current head
#
# A single "URL" row is shown when fetch and push URLs are both defined
# and equal; otherwise each defined URL gets its own row, and "No remote
# URL" is shown when neither is defined.
sub git_remote_block {
	my ($remote, $rdata, $limit, $head) = @_;

	my $heads = $rdata->{'heads'};
	my $fetch = $rdata->{'fetch'};
	my $push = $rdata->{'push'};

	my $urls_table = "<table class=\"projects_list\">\n" ;

	if (defined $fetch) {
		# $push may be undefined here, so test it before comparing
		if (defined $push && $fetch eq $push) {
			$urls_table .= format_repo_url("URL", $fetch);
		} else {
			$urls_table .= format_repo_url("Fetch URL", $fetch);
			$urls_table .= format_repo_url("Push URL", $push) if defined $push;
		}
	} elsif (defined $push) {
		$urls_table .= format_repo_url("Push URL", $push);
	} else {
		$urls_table .= format_repo_url("", "No remote URL");
	}

	$urls_table .= "</table>\n";

	my $dots;
	if (defined $limit && $limit < @$heads) {
		$dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
	}

	print $urls_table;
	git_heads_body($heads, $head, 0, $limit, $dots);
}
5503
# Display a list of remote names with the respective fetch and push URLs.
#
# $remotedata - hash reference mapping remote name to a hash with the
#               keys 'fetch' and 'push'
# $limit      - when true and smaller than the number of remotes, only
#               the first $limit names (sorted) are listed, followed by
#               a "..." link to the 'remotes' view
sub git_remotes_list {
	my ($remotedata, $limit) = @_;
	print "<table class=\"heads\">\n";
	my $alternate = 1;
	my @remotes = sort keys %$remotedata;

	my $limited = $limit && $limit < @remotes;

	$#remotes = $limit - 1 if $limited;

	# iterate with foreach rather than "while (shift ...)": a remote
	# named "0" is false and would end such a loop early
	foreach my $remote (@remotes) {
		my $rdata = $remotedata->{$remote};
		my $fetch = $rdata->{'fetch'};
		my $push = $rdata->{'push'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td>" .
		      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
		               -class=> "list name"},esc_html($remote)) .
		      "</td>";
		# the words "fetch" / "push" are links only when the URL is known
		print "<td class=\"link\">" .
		      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
		      " | " .
		      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
		      "</td>";

		print "</tr>\n";
	}

	if ($limited) {
		print "<tr>\n" .
		      "<td colspan=\"3\">" .
		      $cgi->a({-href => href(action=>"remotes")}, "...") .
		      "</td>\n" . "</tr>\n";
	}

	print "</table>";
}
5547
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names.
#
# $remotedata - hash reference keyed by remote name
# $limit      - when true and smaller than the number of remotes, only
#               the name list is shown; otherwise it caps the number of
#               heads listed per remote
# $head       - passed on to git_remote_block() as the current head
sub git_remotes_body {
	my ($remotedata, $limit, $head) = @_;
	if ($limit and $limit < keys %$remotedata) {
		git_remotes_list($remotedata, $limit);
	} else {
		fill_remote_heads($remotedata);
		# walk the remotes in sorted order, as git_remotes_list() does;
		# this keeps the page stable between requests and does not rely
		# on the hash's shared each() iterator while callbacks run
		foreach my $remote (sort keys %$remotedata) {
			my $rdata = $remotedata->{$remote};
			git_print_section({-class=>"remote", -id=>$remote},
				["remotes", $remote, $remote], sub {
					git_remote_block($remote, $rdata, $limit, $head);
				});
		}
	}
}
5564
# Render the result page of a commit-message, author or committer search.
#
# Takes the parsed commit the search starts from as a flat hash.  Fetches
# up to 101 matching commits starting at offset 100 * $page, so that the
# presence of a 101st entry tells whether a "next" page exists, and then
# prints header, paging navigation, results (or "No match.") and footer.
# Reads the globals $searchtype, $searchtext, $search_use_regexp, $hash,
# $page and $cgi.
sub git_search_message {
	my %co = @_;

	# git-log filter option matching each supported search type
	my %filter_for = (
		'commit'    => "--grep=",
		'author'    => "--author=",
		'committer' => "--committer=",
	);
	my $greptype = $filter_for{$searchtype};
	$greptype .= $searchtext;

	my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
	my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
	                               $greptype, '--regexp-ignore-case',
	                               $match_mode);

	# "first" and "prev" are links on every page but the first one
	my $paging_nav;
	if ($page > 0) {
		my $first_link = $cgi->a({-href => href(-replay=>1, page=>undef)},
		                         "first");
		my $prev_link = $cgi->a({-href => href(-replay=>1, page=>$page-1),
		                         -accesskey => "p", -title => "Alt-p"}, "prev");
		$paging_nav = $first_link . " &sdot; " . $prev_link;
	} else {
		$paging_nav = "first &sdot; prev";
	}

	# more than 100 results means there is a further page
	my $next_link = '';
	if (@commitlist > 100) {
		$next_link =
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
		$paging_nav .= " &sdot; $next_link";
	} else {
		$paging_nav .= " &sdot; next";
	}

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);
	if (@commitlist || $page != 0) {
		git_search_grep_body(\@commitlist, 0, 99, $next_link);
	} else {
		print "<p>No match.</p>\n";
	}

	git_footer_html();
}
5614
# Render the result page of a pickaxe search (git-log -S$searchtext).
#
# Takes the parsed commit shown in the page header as a flat hash.  The
# git-log output is read line by line: a line carrying a commit id
# starts a new table row, and every following raw-diff line adds a link
# to the changed file inside that row.  Reads the globals $searchtext,
# $search_use_regexp, @diff_opts, $hash and $cgi.
sub git_search_changes {
	my %co = @_;

	local $/ = "\n";
	my @pickaxe_opts = ("-S$searchtext");
	push @pickaxe_opts, '--pickaxe-regex' if $search_use_regexp;
	open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
		'--pretty=format:%H', '--no-abbrev', '--raw', @pickaxe_opts
			or die_error(500, "Open git-log failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	print "<table class=\"pickaxe search\">\n";
	my $alternate = 1;
	# from here on %co holds the commit whose row is currently open
	undef %co;

	# close the row of the commit currently held in %co
	my $finish_commit = sub {
		my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
		                          "commit");
		my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
		                                       hash_base=>$co{'id'})},
		                        "tree");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $commit_link .
		      " | " .
		      $tree_link .
		      "</td>\n" .
		      "</tr>\n";
	};

	while (my $line = <$fd>) {
		chomp $line;
		next unless $line;

		my %set = parse_difftree_raw_line($line);
		if (defined $set{'commit'}) {
			# finish previous commit
			$finish_commit->() if %co;

			print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
			$alternate ^= 1;

			%co = parse_commit($set{'commit'});
			my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
			print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
			      "<td><i>$author</i></td>\n" .
			      "<td>" .
			      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
			              -class => "list subject"},
			              chop_and_escape_str($co{'title'}, 50) . "<br/>");
		} elsif (defined $set{'to_id'}) {
			# an all-zero target id gets no file link
			next if ($set{'to_id'} =~ m/^0{40}$/);

			my $file_html = "<span class=\"match\">" . esc_path($set{'file'}) . "</span>";
			print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
			                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
			              -class => "list"},
			              $file_html) .
			      "<br/>\n";
		}
	}
	close $fd;

	# finish last commit
	$finish_commit->() if %co;

	print "</table>\n";

	git_footer_html();
}
5697
# Render the result page of a file-content search (git-grep).
#
# Takes the parsed commit as a flat hash; its 'tree' entry is the tree
# that is searched.  Matches are grouped into one table row per file,
# with one line per match (or a "Binary file" note), and the listing is
# trimmed once the match counter passes 1000.  Reads the globals
# $searchtext, $search_use_regexp, $search_regexp, $hash and $cgi.
sub git_search_files {
	my %co = @_;

	local $/ = "\n";
	# '-e' makes git-grep take $searchtext as the pattern even when it
	# begins with a dash, so user input can never be parsed as an option
	open my $fd, "-|", git_cmd(), 'grep', '-n',
		$search_use_regexp ? ('-E', '-i') : '-F',
		'-e', $searchtext, $co{'tree'}
			or die_error(500, "Open git-grep failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	print "<table class=\"grep_search\">\n";
	my $alternate = 1;
	my $matches = 0;
	# '' means no file row has been opened yet; compared against '' (not
	# tested for truth) so that a file named "0" is handled correctly
	my $lastfile = '';
	while (my $line = <$fd>) {
		chomp $line;
		my ($file, $lno, $ltext, $binary);
		last if ($matches++ > 1000);
		if ($line =~ /^Binary file (.+) matches$/) {
			$file = $1;
			$binary = 1;
		} else {
			# the first field of each line is discarded; the rest are
			# file name, line number and the matching text
			(undef, $file, $lno, $ltext) = split(/:/, $line, 4);
		}
		if ($file ne $lastfile) {
			# close the previous file's row before opening a new one
			print "</td></tr>\n" if ($lastfile ne '');
			# toggle the row class; "$alternate++" was always true and
			# painted every row "dark"
			if ($alternate) {
				print "<tr class=\"dark\">\n";
			} else {
				print "<tr class=\"light\">\n";
			}
			$alternate ^= 1;
			print "<td class=\"list\">".
				$cgi->a({-href => href(action=>"blob", hash=>$co{'hash'},
				                       file_name=>"$file"),
				        -class => "list"}, esc_path($file));
			print "</td><td>\n";
			$lastfile = $file;
		}
		if ($binary) {
			print "<div class=\"binary\">Binary file</div>\n";
		} else {
			$ltext = untabify($ltext);
			# wrap the matching part of the line in a highlight span
			if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
				$ltext = esc_html($1, -nbsp=>1);
				$ltext .= '<span class="match">';
				$ltext .= esc_html($2, -nbsp=>1);
				$ltext .= '</span>';
				$ltext .= esc_html($3, -nbsp=>1);
			} else {
				$ltext = esc_html($ltext, -nbsp=>1);
			}
			print "<div class=\"pre\">" .
				$cgi->a({-href => href(action=>"blob", hash=>$co{'hash'},
				                       file_name=>"$file").'#l'.$lno,
				        -class => "linenr"}, sprintf('%4i', $lno))
				. ' ' .  $ltext . "</div>\n";
		}
	}
	if ($lastfile ne '') {
		print "</td></tr>\n";
		if ($matches > 1000) {
			print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
		}
	} else {
		print "<div class=\"diff nodifferences\">No matches found</div>\n";
	}
	close $fd;

	print "</table>\n";

	git_footer_html();
}
5774
# Print the table of commits found by a commit-message search.
#
# Parameters:
#   $commitlist - reference to an array of parsed commits (hash references)
#   $from, $to  - first and last index to show; $from defaults to 0 and
#                 $to is clamped to the last index of the list
#   $extra      - optional HTML printed as-is in a final table row
#
# For every shown commit, the lines of its comment that match the global
# $search_regexp are listed with the matching part highlighted.
sub git_search_grep_body {
	my ($commitlist, $from, $to, $extra) = @_;
	my $last_index = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last_index if (!defined $to || $last_index < $to);

	# rows alternate between these classes, starting with "dark";
	# skipped (empty) commits do not advance the alternation
	my @row_classes = qw(dark light);
	my $rows_printed = 0;

	print qq(<table class="commit_search">\n);
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		next unless %co;

		my $commit = $co{'id'};
		my $row_class = $row_classes[$rows_printed++ % 2];
		print qq(<tr class="$row_class">\n);

		my $author_cell = format_author_html('td', \%co, 15, 5);
		my $subject_link =
			$cgi->a({-href => href(action=>"commit", hash=>$commit),
			         -class => "list subject"},
			        chop_and_escape_str($co{'title'}, 50) . "<br/>");
		print qq(<td title="$co{'age_string_age'}"><i>$co{'age_string_date'}</i></td>\n) .
		      $author_cell .
		      "<td>" .
		      $subject_link;

		foreach my $line (@{$co{'comment'}}) {
			next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
			my ($lead, $match, $trail) = ($1, $2, $3);

			# shorten the match first, then split the remaining room
			# (at most 30 characters per side) between both contexts
			$match = chop_str($match, 70, 5, 'center');
			my $contextlen = int((80 - length($match))/2);
			if ($contextlen > 30) {
				$contextlen = 30;
			}
			$lead  = chop_str($lead,  $contextlen, 10, 'left');
			$trail = chop_str($trail, $contextlen, 10, 'right');

			print esc_html($lead) .
			      '<span class="match">' . esc_html($match) . '</span>' .
			      esc_html($trail) . '<br />';
		}

		my @links = (
			$cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit"),
			$cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
			$cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$commit)}, "tree"),
		);
		print "</td>\n" .
		      qq(<td class="link">) .
		      join(" | ", @links);
		print "</td>\n</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      qq(<td colspan="3">$extra</td>\n) .
		      "</tr>\n";
	}
	print "</table>\n";
}
5834
5835 ## ======================================================================
5836 ## ======================================================================
5837 ## actions
5838
# Action: show the list of all projects, preceded by the optional
# $home_text include file and a project search form.
#
# The 'order' input parameter, when given, must be exactly one of
# none, project, descr, owner or age; anything else is rejected with
# a 400 error.  A 404 error is raised when no projects are found.
sub git_project_list {
	my $order = $input_params{'order'};
	# anchored on both ends, so that a value merely containing one of
	# the keywords is not accepted
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list();
	if (!@list) {
		die_error(404, "No projects found");
	}

	git_header_html();
	if (defined $home_text && -f $home_text) {
		print "<div class=\"index_include\">\n";
		insert_file($home_text);
		print "</div>\n";
	}
	# start_form() rather than its old alias startform(), which newer
	# CGI.pm releases no longer provide
	print $cgi->start_form(-method => "get") .
	      "<p class=\"projsearch\">Search:\n" .
	      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
	      "</p>" .
	      $cgi->end_form() . "\n";
	git_project_list_body(\@list, $order);
	git_footer_html();
}
5864
# Action: show the list of forks of the current $project.
#
# The 'order' input parameter, when given, must be exactly one of
# none, project, descr, owner or age; anything else is rejected with
# a 400 error.  A 404 error is raised when the project has no forks.
sub git_forks {
	my $order = $input_params{'order'};
	# anchored on both ends, so that a value merely containing one of
	# the keywords is not accepted
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list($project);
	if (!@list) {
		die_error(404, "No forks found");
	}

	git_header_html();
	git_print_page_nav('','');
	git_print_header_div('summary', "$project forks");
	git_project_list_body(\@list, $order);
	git_footer_html();
}
5882
# Action: output a plain-text project index, one "<path> <owner>" line
# per project.  Both fields are percent-encoded, except that '/' is kept
# and a space is written as '+'.  Raises a 404 error when there are no
# projects.
sub git_project_index {
	my @projects = git_get_projects_list();
	die_error(404, "No projects found") unless @projects;

	print $cgi->header(
		-type => 'text/plain',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="index.aux"');

	foreach my $pr (@projects) {
		# look the owner up only when the project list did not provide it
		$pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
			unless exists $pr->{'owner'};

		my @fields = ($pr->{'path'}, $pr->{'owner'});
		foreach my $field (@fields) {
			# quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
			$field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
			$field =~ s/ /\+/g;
		}

		print "$fields[0] $fields[1]\n";
	}
}
5909
# Action: project summary page.
#
# Prints the project metadata table (description, owner, last change,
# clone URLs and, if enabled, content tags), the README.html include
# (unless XSS prevention is on), and then short sections for shortlog,
# tags, heads, remotes and forks.  Each list section shows at most 16
# entries and gets a "..." link to the full view when there are more.
sub git_summary {
	my $descr = git_get_project_description($project) || "none";
	my %co = parse_commit("HEAD");
	my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
	my $head = $co{'id'};
	my $remote_heads = gitweb_check_feature('remote_heads');

	my $owner = git_get_project_owner($project);

	my $refs = git_get_references();
	# The lists are requested with a limit of 16; as noted in the
	# original code, the get_*_list functions return one more entry
	# than that, which lets us tell whether there is more to show.
	my @taglist  = git_get_tags_list(16);
	my @headlist = git_get_heads_list(16);
	my %remotedata = $remote_heads ? git_get_remotes_list() : ();
	my @forklist;
	my $check_forks = gitweb_check_feature('forks');

	if ($check_forks) {
		# forks of this project, without forks of forks
		@forklist = git_get_projects_list($project);
		if (@forklist) {
			@forklist = filter_forks_from_projects_list(\@forklist);
		}
	}

	# "..." link to the full view for $action, or undef when the list
	# has no entry beyond the 16 shown (indices 0..15)
	my $more_link = sub {
		my ($list, $action) = @_;
		return $#{$list} <= 15 ? undef :
		       $cgi->a({-href => href(action=>$action)}, "...");
	};

	git_header_html();
	git_print_page_nav('summary','', $head);

	print "<div class=\"title\">&nbsp;</div>\n";
	print qq(<table class="projects_list">\n) .
	      qq(<tr id="metadata_desc"><td>description</td><td>) . esc_html($descr) . "</td></tr>\n" .
	      qq(<tr id="metadata_owner"><td>owner</td><td>) . esc_html($owner) . "</td></tr>\n";
	if (defined $cd{'rfc2822'}) {
		print qq(<tr id="metadata_lchange"><td>last change</td>) .
		      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
	}

	# use per project git URL list in $projectroot/$project/cloneurl
	# or make project git URL from git base URL and project name
	my @url_list = git_get_project_url_list($project);
	if (!@url_list) {
		@url_list = map { "$_/$project" } @git_base_url_list;
	}
	# only the first printed URL row carries the "URL" label
	my $url_tag = "URL";
	foreach my $git_url (grep { $_ } @url_list) {
		print format_repo_url($url_tag, $git_url);
		$url_tag = "";
	}

	# Tag cloud
	if (gitweb_check_feature('ctags')) {
		my $ctags = git_get_project_ctags($project);
		# without ability to add tags, don't show if there are none
		if (%$ctags) {
			my $cloud = git_populate_project_tagcloud($ctags);
			print qq(<tr id="metadata_ctags">) .
			      "<td>content tags</td>" .
			      "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
			      "</tr>\n";
		}
	}

	print "</table>\n";

	# If XSS prevention is on, we don't include README.html.
	# TODO: Allow a readme in some safe format.
	my $readme = "$projectroot/$project/README.html";
	if (!$prevent_xss && -s $readme) {
		print "<div class=\"title\">readme</div>\n" .
		      "<div class=\"readme\">\n";
		insert_file($readme);
		print "\n</div>\n"; # class="readme"
	}

	# we need to request one more than 16 (0..15) to check if
	# those 16 are all
	my @commitlist = $head ? parse_commits($head, 17) : ();
	if (@commitlist) {
		git_print_header_div('shortlog');
		git_shortlog_body(\@commitlist, 0, 15, $refs,
		                  $more_link->(\@commitlist, "shortlog"));
	}

	if (@taglist) {
		git_print_header_div('tags');
		git_tags_body(\@taglist, 0, 15,
		              $more_link->(\@taglist, "tags"));
	}

	if (@headlist) {
		git_print_header_div('heads');
		git_heads_body(\@headlist, $head, 0, 15,
		               $more_link->(\@headlist, "heads"));
	}

	if (%remotedata) {
		git_print_header_div('remotes');
		git_remotes_body(\%remotedata, 15, $head);
	}

	if (@forklist) {
		git_print_header_div('forks');
		git_project_list_body(\@forklist, 'age', 0, 15,
		                      $more_link->(\@forklist, "forks"),
		                      'no_header');
	}

	git_footer_html();
}
6023
# Action: show a single tag object, identified by the global $hash.
#
# Prints a header table linking to the tagged object (using the object
# type as the action), the tagger rows when an author is recorded, and
# then the tag message line by line.  Raises a 404 error when the tag
# cannot be parsed.
sub git_tag {
	my %tag = parse_tag($hash);
	die_error(404, "Unknown tag object") unless %tag;

	my $head = git_get_head_hash($project);
	git_header_html();
	git_print_page_nav('','', $head,undef,$head);
	git_print_header_div('commit', esc_html($tag{'name'}), $hash);

	# both cells of the object row link to the same view of the object
	my $object_url = href(action=>$tag{'type'}, hash=>$tag{'object'});
	print qq(<div class="title_text">\n) .
	      qq(<table class="object_header">\n) .
	      "<tr>\n" .
	      "<td>object</td>\n" .
	      "<td>" .
	      $cgi->a({-class => "list", -href => $object_url}, $tag{'object'}) .
	      "</td>\n" .
	      qq(<td class="link">) .
	      $cgi->a({-href => $object_url}, $tag{'type'}) .
	      "</td>\n" .
	      "</tr>\n";
	git_print_authorship_rows(\%tag, 'author')
		if defined($tag{'author'});
	print "</table>\n\n" .
	      "</div>\n";

	print qq(<div class="page_body">);
	foreach my $line (@{$tag{'comment'}}) {
		chomp $line;
		print esc_html($line, -nbsp=>1) . "<br/>\n";
	}
	print "</div>\n";
	git_footer_html();
}
6058
# Common implementation of the blame views.
#
# The optional first argument selects the output format:
#   'porcelain'   (default) - full HTML page built from `git blame -p`
#   'incremental' - HTML page with the plain file contents; the page
#                   states that it requires JavaScript to run
#   'data'        - raw `git blame --incremental` output as text/plain,
#                   terminated by an "END" line
# A 'porcelain' request with the 'js' CGI parameter set is turned into an
# 'incremental' one (and the global $action is updated accordingly).
#
# Uses the globals $file_name, $hash_base and $hash; dies via die_error()
# when blame is disabled, the file name is missing, or the commit / blob
# cannot be found.
sub git_blame_common {
	my $format = shift || 'porcelain';
	if ($format eq 'porcelain' && $cgi->param('js')) {
		$format = 'incremental';
		$action = 'blame_incremental'; # for page title etc
	}

	# permissions
	gitweb_check_feature('blame')
		or die_error(403, "Blame view not allowed");

	# error checking
	die_error(400, "No file name given") unless $file_name;
	$hash_base ||= git_get_head_hash($project);
	die_error(404, "Couldn't find base commit") unless $hash_base;
	my %co = parse_commit($hash_base)
		or die_error(404, "Commit not found");
	my $ftype = "blob";
	if (!defined $hash) {
		$hash = git_get_hash_by_path($hash_base, $file_name, "blob")
			or die_error(404, "Error looking up file");
	} else {
		$ftype = git_get_type($hash);
		# exact string comparison: the type must be "blob" itself, not
		# merely contain it; an unknown (undefined) type is rejected too
		if (!defined $ftype || $ftype ne "blob") {
			die_error(400, "Object is not a blob");
		}
	}

	my $fd;
	if ($format eq 'incremental') {
		# get file contents (as base)
		open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
			or die_error(500, "Open git-cat-file failed");
	} elsif ($format eq 'data') {
		# run git-blame --incremental
		open $fd, "-|", git_cmd(), "blame", "--incremental",
			$hash_base, "--", $file_name
			or die_error(500, "Open git-blame --incremental failed");
	} else {
		# run git-blame --porcelain
		open $fd, "-|", git_cmd(), "blame", '-p',
			$hash_base, '--', $file_name
			or die_error(500, "Open git-blame --porcelain failed");
	}

	# incremental blame data returns early
	if ($format eq 'data') {
		print $cgi->header(
			-type=>"text/plain", -charset => "utf-8",
			-status=> "200 OK");
		local $| = 1; # output autoflush
		print while <$fd>;
		close $fd
			or print "ERROR $!\n";

		# the END line optionally carries timing information
		print 'END';
		if (defined $t0 && gitweb_check_feature('timed')) {
			print ' '.
			      tv_interval($t0, [ gettimeofday() ]).
			      ' '.$number_of_git_cmds;
		}
		print "\n";

		return;
	}

	# page header
	git_header_html();
	my $formats_nav =
		$cgi->a({-href => href(action=>"blob", -replay=>1)},
		        "blob") .
		" | ";
	if ($format eq 'incremental') {
		$formats_nav .=
			$cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
			        "blame") . " (non-incremental)";
	} else {
		$formats_nav .=
			$cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
			        "blame") . " (incremental)";
	}
	$formats_nav .=
		" | " .
		$cgi->a({-href => href(action=>"history", -replay=>1)},
		        "history") .
		" | " .
		$cgi->a({-href => href(action=>$action, file_name=>$file_name)},
		        "HEAD");
	git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
	git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
	git_print_page_path($file_name, $ftype, $hash_base);

	# page body
	if ($format eq 'incremental') {
		print "<noscript>\n<div class=\"error\"><center><b>\n".
		      "This page requires JavaScript to run.\n Use ".
		      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
		              'this page').
		      " instead.\n".
		      "</b></center></div>\n</noscript>\n";

		print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
	}

	print qq!<div class="page_body">\n!;
	print qq!<div id="progress_info">... / ...</div>\n!
		if ($format eq 'incremental');
	print qq!<table id="blame_table" class="blame" width="100%">\n!.
	      #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
	      qq!<thead>\n!.
	      qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
	      qq!</thead>\n!.
	      qq!<tbody>\n!;

	my @rev_color = qw(light dark);
	my $num_colors = scalar(@rev_color);
	my $current_color = 0;

	if ($format eq 'incremental') {
		my $color_class = $rev_color[$current_color];

		# contents of a file; commit and line links are left empty here
		my $linenr = 0;
	LINE:
		while (my $line = <$fd>) {
			chomp $line;
			$linenr++;

			print qq!<tr id="l$linenr" class="$color_class">!.
			      qq!<td class="sha1"><a href=""> </a></td>!.
			      qq!<td class="linenr">!.
			      qq!<a class="linenr" href="">$linenr</a></td>!;
			print qq!<td class="pre">! . esc_html($line) . "</td>\n";
			print qq!</tr>\n!;
		}

	} else { # porcelain, i.e. ordinary blame
		my %metainfo = (); # saves information about commits

		# blame data
	LINE:
		while (my $line = <$fd>) {
			chomp $line;
			# the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
			# no <lines in group> for subsequent lines in group of lines
			my ($full_rev, $orig_lineno, $lineno, $group_size) =
			   ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
			if (!exists $metainfo{$full_rev}) {
				$metainfo{$full_rev} = { 'nprevious' => 0 };
			}
			my $meta = $metainfo{$full_rev};
			# read the "<key> <value>" header lines of this entry up to
			# the TAB-prefixed line holding the file contents; only the
			# first value seen for a key is kept for a given commit
			my $data;
			while ($data = <$fd>) {
				chomp $data;
				last if ($data =~ s/^\t//); # contents of line
				if ($data =~ /^(\S+)(?: (.*))?$/) {
					$meta->{$1} = $2 unless exists $meta->{$1};
				}
				if ($data =~ /^previous /) {
					$meta->{'nprevious'}++;
				}
			}
			my $short_rev = substr($full_rev, 0, 8);
			my $author = $meta->{'author'};
			my %date =
				parse_date($meta->{'author-time'}, $meta->{'author-tz'});
			my $date = $date{'iso-tz'};
			# a header with a group size starts a new group of lines:
			# switch to the next row color
			if ($group_size) {
				$current_color = ($current_color + 1) % $num_colors;
			}
			my $tr_class = $rev_color[$current_color];
			$tr_class .= ' boundary' if (exists $meta->{'boundary'});
			$tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
			$tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
			print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
			# the commit cell is printed once per group, spanning its rows
			if ($group_size) {
				print "<td class=\"sha1\"";
				print " title=\"". esc_html($author) . ", $date\"";
				print " rowspan=\"$group_size\"" if ($group_size > 1);
				print ">";
				print $cgi->a({-href => href(action=>"commit",
				                             hash=>$full_rev,
				                             file_name=>$file_name)},
				              esc_html($short_rev));
				if ($group_size >= 2) {
					my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
					if (@author_initials) {
						print "<br />" .
						      esc_html(join('', @author_initials));
						#           or join('.', ...)
					}
				}
				print "</td>\n";
			}
			# 'previous' <sha1 of parent commit> <filename at commit>
			if (exists $meta->{'previous'} &&
			    $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
				$meta->{'parent'} = $1;
				$meta->{'file_parent'} = unquote($2);
			}
			# the line number links to the blame of the parent commit
			# when one is known, otherwise to the blamed commit itself
			my $linenr_commit =
				exists($meta->{'parent'}) ?
				$meta->{'parent'} : $full_rev;
			my $linenr_filename =
				exists($meta->{'file_parent'}) ?
				$meta->{'file_parent'} : unquote($meta->{'filename'});
			my $blamed = href(action => 'blame',
			                  file_name => $linenr_filename,
			                  hash_base => $linenr_commit);
			print "<td class=\"linenr\">";
			print $cgi->a({ -href => "$blamed#l$orig_lineno",
			                -class => "linenr" },
			              esc_html($lineno));
			print "</td>";
			print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
			print "</tr>\n";
		} # end while

	}

	# footer
	print "</tbody>\n".
	      "</table>\n"; # class="blame"
	print "</div>\n";   # class="page_body"
	close $fd
		or print "Reading blob failed\n";

	git_footer_html();
}
6288
# Action: blame view in the default format of git_blame_common().
sub git_blame {
	return git_blame_common();
}
6292
# Action: blame view in the 'incremental' format of git_blame_common().
sub git_blame_incremental {
	return git_blame_common('incremental');
}
6296
# Action: blame output in the 'data' format of git_blame_common().
sub git_blame_data {
	return git_blame_common('data');
}
6300
# Action: page listing all tags of the current project.  The tags table
# is printed only when the project has at least one tag.
sub git_tags {
	my $head = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
	git_print_header_div('summary', $project);

	my @tagslist = git_get_tags_list();
	git_tags_body(\@tagslist) if @tagslist;

	git_footer_html();
}
6313
# Action: page listing all heads of the current project.  The heads
# table is printed only when the project has at least one head.
sub git_heads {
	my $head = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
	git_print_header_div('summary', $project);

	my @headslist = git_get_heads_list();
	git_heads_body(\@headslist, $head) if @headslist;

	git_footer_html();
}
6326
# Action: remotes view.  Serves both the page for a single remote (when
# the 'hash' input parameter names one) and the list of all remotes.
#
# Dies with 403 when the 'remote_heads' feature is off, with 500 when
# the remote information cannot be read, and with 404 when nothing
# matching was found.
sub git_remotes {
	if (!gitweb_check_feature('remote_heads')) {
		die_error(403, "Remote heads view is disabled");
	}

	my $head = git_get_head_hash($project);
	my $remote = $input_params{'hash'};

	my $remotedata = git_get_remotes_list($remote);
	if (!defined $remotedata) {
		die_error(500, "Unable to get remote information");
	}

	if (!%$remotedata) {
		my $message = defined $remote
			? "Remote $remote not found"
			: "No remotes found";
		die_error(404, $message);
	}

	git_header_html(undef, undef, -action_extra => $remote);
	git_print_page_nav('', '',  $head, undef, $head,
		format_ref_views($remote ? '' : 'remotes'));

	fill_remote_heads($remotedata);
	if (!defined $remote) {
		# list of all the remotes
		git_print_header_div('summary', "$project remotes");
		git_remotes_body($remotedata, undef, $head);
	} else {
		# single remote
		git_print_header_div('remotes', "$remote remote for $project");
		git_remote_block($remote, $remotedata->{$remote}, undef, $head);
	}

	git_footer_html();
}
6359
# Action: send the raw contents of a blob.
#
# The optional argument is a content type to use; it is passed on to
# blob_contenttype() together with the file handle and file name.  The
# blob is identified by the global $hash, or looked up from $hash_base
# (default: HEAD) and $file_name.  Dies with 400 when neither a hash nor
# a file name is given and with 404 when the file cannot be found.
sub git_blob_plain {
	my $type = shift;
	my $expires;

	if (!defined $hash) {
		if (defined $file_name) {
			my $base = $hash_base || git_get_head_hash($project);
			$hash = git_get_hash_by_path($base, $file_name, "blob")
				or die_error(404, "Cannot find file");
		} else {
			die_error(400, "No file name defined");
		}
	} elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		# blobs defined by non-textual hash id's can be cached
		$expires = "+1d";
	}

	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or die_error(500, "Open git-cat-file blob '$hash' failed");

	# content-type (can include charset)
	$type = blob_contenttype($fd, $file_name, $type);

	# "save as" filename, even when no $file_name is given
	my $save_as = "$hash";
	if (defined $file_name) {
		$save_as = $file_name;
	} elsif ($type =~ m/^text\//) {
		$save_as .= '.txt';
	}

	# With XSS prevention on, blobs of all types except a few known safe
	# ones are served with "Content-Disposition: attachment" to make sure
	# they don't run in our security domain.  For certain image types,
	# blob view writes an <img> tag referring to blob_plain view, and we
	# want to be sure not to break that by serving the image as an
	# attachment (though Firefox 3 doesn't seem to care).
	my $sandbox = $prevent_xss &&
		$type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

	# serve text/* as text/plain; the same goes for textual <type>/<name>+xml
	# content such as image/svg+xml (the subtype name before "+xml" may be
	# any number of letters, not just one)
	if ($prevent_xss &&
	    ($type =~ m!^text/[a-z]+\b(.*)$! ||
	     ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
		my $rest = $1;
		$rest = defined $rest ? $rest : '';
		$type = "text/plain$rest";
	}

	# the file name goes into a quoted string in the header, so
	# backslashes and double quotes in it must be backslash-escaped
	(my $quoted_name = $save_as) =~ s/(["\\])/\\$1/g;

	print $cgi->header(
		-type => $type,
		-expires => $expires,
		-content_disposition =>
			($sandbox ? 'attachment' : 'inline')
			. '; filename="' . $quoted_name . '"');
	local $/ = undef;
	binmode STDOUT, ':raw';
	print <$fd>;
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
6421
# Show a single blob as an HTML page (the 'blob' action).
#
# Operates on the request globals $hash, $hash_base and $file_name:
#   - if $hash is not given, it is resolved from $file_name relative to
#     $hash_base (or, failing that, git_get_head_hash($project));
#   - content whose MIME type is neither text/* nor a gif/png/jpeg image and
#     which also tests as binary (-B) is handed over to git_blob_plain();
#   - images are embedded with an <img> tag pointing at the 'blob_plain' view;
#   - anything else is printed line by line with line-number anchors, after
#     being piped through the highlighter when a syntax could be guessed.
#
# Errors are reported through die_error(): 400 when there is neither a hash
# nor a file name, 404 when the file cannot be found, 500 when git-cat-file
# cannot be started.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        # from here on $fd is the highlighter's output when a syntax was found
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable commit context: print a bare navigation bar and
                # use the blob id as the title
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                # the URL goes into an attribute value, so escape it the same
                # way the line-number links below do
                print qq! src="! .
                      esc_attr(href(action=>"blob_plain", hash=>$hash,
                                    hash_base=>$hash_base, file_name=>$file_name)) .
                      qq!" />\n!;
        } else {
                my $nr;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        # highlighted output is passed through sanitize();
                        # plain text is HTML-escaped here
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, esc_attr(href(-replay => 1)), $nr, $nr,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
6514
# Show a tree (directory listing) as an HTML page (the 'tree' action).
#
# Operates on the request globals $hash, $hash_base and $file_name:
#   - $hash_base defaults to "HEAD";
#   - if $hash is not given, it is resolved from $file_name within
#     $hash_base, or set to $hash_base itself when there is no file name.
#
# The entries come from "git ls-tree -z" (with -l when the 'show-sizes'
# feature is enabled) and are printed as table rows with alternating
# "dark"/"light" classes, preceded by a ".." row when a parent directory
# can be linked.
#
# Errors are reported through die_error(): 404 when the tree cannot be
# resolved or read, 500 when git-ls-tree cannot be started.
sub git_tree {
        if (!defined $hash_base) {
                $hash_base = "HEAD";
        }
        if (!defined $hash) {
                if (defined $file_name) {
                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
                } else {
                        $hash = $hash_base;
                }
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # ls-tree -z terminates records with NUL, so read and chomp
                # NUL-separated records inside this scope only
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = map { chomp; $_ } <$fd>;
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                if (defined $snapshot_links) {
                        # FIXME: Should be available when we have no hash base as well.
                        push @views_nav, $snapshot_links;
                }
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # $hash_base did not parse as a commit: forget it so that no
                # commit-relative links (including '..') are generated below
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                if ($basedir ne '' && substr($basedir, -1) ne '/') {
                        $basedir .= '/';
                }
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";
        my $alternate = 1;
        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                # strip the last path component to get the parent directory
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                # Only an empty result means "top of the tree".  A plain
                # truthiness test would also discard a parent directory
                # literally named "0".
                undef $up if $up eq '';
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $line (@entries) {
                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
6624
# Build the base name "<project>-<version>" used for a snapshot of $hash
# in $project.
#
# In list context the name is returned twice (the caller in git_snapshot
# takes the pair as file name and archive prefix); in scalar context it is
# returned once.
sub snapshot_name {
        my ($project, $hash) = @_;

        # reduce the project path to its last meaningful component:
        #   path/to/project.git  -> project
        #   path/to/project/.git -> project
        my $name = to_utf8($project);
        $name =~ s,([^/])/*\.git$,$1,;
        $name = basename($name);
        # control characters are replaced by '?'
        $name =~ s/[[:cntrl:]]/?/g;

        my $ver = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # hexadecimal string: replace it by the short hash, but only
                # if it is a prefix of the full hash and longer than 7 chars
                my $full_hash = git_get_full_hash($project, $hash);
                $ver = git_get_short_hash($project, $hash)
                        if ($full_hash =~ /^$hash/ && length($hash) > 7);
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # a tag name is used as is, without a hash suffix
                $ver = $1;
        } else {
                # branches and anything else: drop a refs/heads/ or
                # refs/remotes/ prefix and append the short hash
                $ver = $1
                        if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!);
                $ver .= '-' . git_get_short_hash($project, $hash);
        }
        # hierarchical branch names: turn every '/' into '.'
        $ver =~ tr!/!.!;

        # name = project-version_string
        $name .= "-$ver";

        return $name unless wantarray;
        return ($name, $name);
}
6661
# Send a snapshot archive of $hash to the client (the 'snapshot' action).
#
# The format is taken from $input_params{'snapshot_format'} and defaults to
# the first entry of @snapshot_fmts.  It has to be a known, enabled and
# supported entry of %known_snapshot_formats.  The archive is produced by
# "git archive", optionally piped through the format's compressor command.
#
# Errors are reported through die_error():
#   403 - snapshots, or the requested format, are not allowed
#   400 - malformed or unknown format, or the object is a blob
#   404 - the object does not exist
#   500 - the archive pipeline could not be started
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # "^{}" peels tags, so the type is that of the object finally named
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # Start the pipeline before anything is written to the client, so
        # that a failure here is reported as a clean 500 instead of an error
        # page appended to an already sent "200 OK" header.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        # escape '"' and '\' so that the name is a valid quoted-string
        $filename =~ s/(["\\])/\\$1/g;
        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        {
                # Copy the archive in fixed-size chunks; reading the handle
                # in list context would hold the whole archive in memory.
                local $/ = \65536;
                while (my $chunk = <$fd>) {
                        print $chunk;
                }
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6709
# Common driver for log-like views: collects one page of commits, prints the
# page header and navigation, and delegates the body to a callback.
#
# Parameters:
#   $fmt_name  - view name, passed to format_paging_nav() and
#                git_print_page_nav()
#   $body_subr - code reference that prints the commits; called as
#                $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
#                             $file_name, $file_hash, $ftype)
#   $base      - revision to list from; defaults to the project's head hash
#   $parent    - optional; when defined, the range "$parent..$base" is listed
#   $file_name - optional; restrict the listing to this path
#   $file_hash - optional; object id of $file_name; when omitted it is looked
#                up in the listed commits
#
# The page number is taken from the global $page (default 0).  101 commits
# are requested for each page of 100, so that the presence of a further page
# can be detected.
#
# Errors are reported through die_error(): 500 when the type of the object
# for $file_name cannot be determined, 404 when $base is not a commit.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        if (!defined $base) {
                $base = $head;
        }
        if (!defined $page) {
                $page = 0;
        }
        my $refs = git_get_references();

        my $commit_hash = $base;
        if (defined $parent) {
                $commit_hash = "$parent..$base";
        }
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }


        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
        my $next_link = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # Take the feature value in list context, as git_commitdiff does.
        # NOTE(review): gitweb_get_feature() is defined outside this section;
        # if it returns a list, a scalar assignment would not yield the
        # configured limit -- confirm against its definition.
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                # a negative limit always offers the link; otherwise only
                # when the page holds no more commits than the limit
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                git_print_header_div('summary', $project)
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
6783
# Entry point of the 'log' view: runs git_log_generic() with git_log_body as
# the body printer, using the request's $hash as base and $hash_parent as
# parent.
sub git_log {
        my @range = ($hash, $hash_parent);
        git_log_generic('log', \&git_log_body, @range);
}
6788
# Render the 'commit' view for $hash (falling back to $hash_base, then
# "HEAD"): navigation bar, header table with authorship, tree and parent
# rows, the log message, and the list of changes from git-diff-tree.
#
# Errors are reported through die_error(): 404 for an unknown commit or a
# failed diff-tree read, 500 when git-diff-tree cannot be started.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # link to the 'commit' view of an id, labelled with its first 7 chars
        my $short_commit_link = sub {
                my ($id) = @_;
                return $cgi->a({-href => href(action=>"commit",
                                              hash=>$id)},
                               esc_html(substr($id, 0, 7)));
        };

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                $formats_nav = '(parent: ' . $short_commit_link->($parent) . ')';
        } else {
                # merge commit
                my @parent_links = map { $short_commit_link->($_) } @$parents;
                $formats_nav = '(merge: ' . join(' ', @parent_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # a commit without parent is passed to diff-tree as '--root'
        $parent = "--root"
                unless defined $parent;

        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                (@$parents <= 1 ? $parent : '-c'),
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        my @difftree = <$fd>;
        chomp @difftree;
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        # the title links to the commitdiff, or to the tree for a root commit
        my $title = esc_html($co{'title'}) . $ref;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title, $hash);
        } else {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        }

        # header table: authorship, commit id, tree, parents
        print qq{<div class="title_text">\n} .
              qq{<table class="object_header">\n};
        git_print_authorship_rows(\%co);
        print '<tr><td>commit</td><td class="sha1">' . $co{'id'} . "</td></tr>\n";

        my $tree_id_link =
                $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                         class => "list"}, $co{'tree'});
        my $tree_view_link =
                $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                        "tree");
        print '<tr>' .
              '<td>tree</td>' .
              '<td class="sha1">' . $tree_id_link . '</td>' .
              '<td class="link">' . $tree_view_link;
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td></tr>\n";

        foreach my $par (@$parents) {
                my $parent_id_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$par),
                                 class => "list"}, $par);
                my $parent_commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit");
                my $parent_diff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff");
                print '<tr>' .
                      '<td>parent</td>' .
                      '<td class="sha1">' . $parent_id_link . '</td>' .
                      '<td class="link">' .
                      $parent_commit_link . ' | ' . $parent_diff_link .
                      '</td>' .
                      "</tr>\n";
        }
        print "</table></div>\n";

        # log message
        print qq{<div class="page_body">\n};
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
6902
# Determine the type of the requested object and redirect (302) to the view
# named after that type (the 'object' action).
#
# The object is identified by the request globals in one of two ways:
#   - $hash or $hash_base alone: the type comes from "git cat-file -t";
#   - $hash_base and $file_name: type and id are taken from the matching
#     "git ls-tree" line, and $hash is set to that id.
#
# Errors are reported through die_error(): 404 when the object, the base
# object or the path does not exist, 500 when git-ls-tree cannot be started,
# 400 when neither form is given.
sub git_object {
        # object is defined by:
        # - hash or hash_base alone
        # - hash_base and file_name
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # nothing is read when the command prints no output; skip
                # chomp then and let the close check report the 404
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                # trailing slashes are dropped before the path is looked up
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
6949
# Show the difference between two versions of a blob (the 'blobdiff' and
# 'blobdiff_plain' actions).
#
# Parameter:
#   $format - 'html' (default) or 'plain'
#
# Only "new style" requests are served, i.e. those with both $hash_base and
# $hash_parent_base.  The file is then identified either by $file_name
# (optionally with $file_parent) or by a full 40-hex $hash, which is matched
# against the destination ids of the raw diff-tree output.  Missing values
# among $file_parent, $file_name, $hash_parent and $hash are filled in from
# the single matching raw diff line.
#
# Errors are reported through die_error():
#   400 - parameters missing, ambiguous diff, or unknown format
#   404 - diff not found, diff-tree read failure, or a request without
#         $hash_base / $hash_parent_base
#   500 - git-diff-tree cannot be started
sub git_blobdiff {
        my $format = shift || 'html';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /^[0-9a-fA-F]{40}$/) {
                        # try to find filename from $hash
                        # (the check is anchored: $hash is used inside a
                        # pattern below and has to be exactly one object id)

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # numeric status, like every other die_error() call here
                die_error(404, "Missing one of the blob diff parameters")
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # escape '"' and '\' so that the suggested name stays a valid
                # quoted-string, as git_snapshot does for its file name
                (my $save_as = $file_name) =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $save_as . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # rewrite "a/<id>" and "b/<id>" to file names in the patch
                # header; the header ends with the "+++" line
                while (my $line = <$fd>) {
                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7081
# Entry point of the 'blobdiff_plain' view: git_blobdiff() in its 'plain'
# output format.
sub git_blobdiff_plain {
        my $format = 'plain';
        return git_blobdiff($format);
}
7085
7086 sub git_commitdiff {
7087         my %params = @_;
7088         my $format = $params{-format} || 'html';
7089
7090         my ($patch_max) = gitweb_get_feature('patches');
7091         if ($format eq 'patch') {
7092                 die_error(403, "Patch view not allowed") unless $patch_max;
7093         }
7094
7095         $hash ||= $hash_base || "HEAD";
7096         my %co = parse_commit($hash)
7097             or die_error(404, "Unknown commit object");
7098
7099         # choose format for commitdiff for merge
7100         if (! defined $hash_parent && @{$co{'parents'}} > 1) {
7101                 $hash_parent = '--cc';
7102         }
7103         # we need to prepare $formats_nav before almost any parameter munging
7104         my $formats_nav;
7105         if ($format eq 'html') {
7106                 $formats_nav =
7107                         $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
7108                                 "raw");
7109                 if ($patch_max && @{$co{'parents'}} <= 1) {
7110                         $formats_nav .= " | " .
7111                                 $cgi->a({-href => href(action=>"patch", -replay=>1)},
7112                                         "patch");
7113                 }
7114
7115                 if (defined $hash_parent &&
7116                     $hash_parent ne '-c' && $hash_parent ne '--cc') {
7117                         # commitdiff with two commits given
7118                         my $hash_parent_short = $hash_parent;
7119                         if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
7120                                 $hash_parent_short = substr($hash_parent, 0, 7);
7121                         }
7122                         $formats_nav .=
7123                                 ' (from';
7124                         for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
7125                                 if ($co{'parents'}[$i] eq $hash_parent) {
7126                                         $formats_nav .= ' parent ' . ($i+1);
7127                                         last;
7128                                 }
7129                         }
7130                         $formats_nav .= ': ' .
7131                                 $cgi->a({-href => href(action=>"commitdiff",
7132                                                        hash=>$hash_parent)},
7133                                         esc_html($hash_parent_short)) .
7134                                 ')';
7135                 } elsif (!$co{'parent'}) {
7136                         # --root commitdiff
7137                         $formats_nav .= ' (initial)';
7138                 } elsif (scalar @{$co{'parents'}} == 1) {
7139                         # single parent commit
7140                         $formats_nav .=
7141                                 ' (parent: ' .
7142                                 $cgi->a({-href => href(action=>"commitdiff",
7143                                                        hash=>$co{'parent'})},
7144                                         esc_html(substr($co{'parent'}, 0, 7))) .
7145                                 ')';
7146                 } else {
7147                         # merge commit
7148                         if ($hash_parent eq '--cc') {
7149                                 $formats_nav .= ' | ' .
7150                                         $cgi->a({-href => href(action=>"commitdiff",
7151                                                                hash=>$hash, hash_parent=>'-c')},
7152                                                 'combined');
7153                         } else { # $hash_parent eq '-c'
7154                                 $formats_nav .= ' | ' .
7155                                         $cgi->a({-href => href(action=>"commitdiff",
7156                                                                hash=>$hash, hash_parent=>'--cc')},
7157                                                 'compact');
7158                         }
7159                         $formats_nav .=
7160                                 ' (merge: ' .
7161                                 join(' ', map {
7162                                         $cgi->a({-href => href(action=>"commitdiff",
7163                                                                hash=>$_)},
7164                                                 esc_html(substr($_, 0, 7)));
7165                                 } @{$co{'parents'}} ) .
7166                                 ')';
7167                 }
7168         }
7169
7170         my $hash_parent_param = $hash_parent;
7171         if (!defined $hash_parent_param) {
7172                 # --cc for multiple parents, --root for parentless
7173                 $hash_parent_param =
7174                         @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
7175         }
7176
7177         # read commitdiff
7178         my $fd;
7179         my @difftree;
7180         if ($format eq 'html') {
7181                 open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7182                         "--no-commit-id", "--patch-with-raw", "--full-index",
7183                         $hash_parent_param, $hash, "--"
7184                         or die_error(500, "Open git-diff-tree failed");
7185
7186                 while (my $line = <$fd>) {
7187                         chomp $line;
7188                         # empty line ends raw part of diff-tree output
7189                         last unless $line;
7190                         push @difftree, scalar parse_difftree_raw_line($line);
7191                 }
7192
7193         } elsif ($format eq 'plain') {
7194                 open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7195                         '-p', $hash_parent_param, $hash, "--"
7196                         or die_error(500, "Open git-diff-tree failed");
7197         } elsif ($format eq 'patch') {
7198                 # For commit ranges, we limit the output to the number of
7199                 # patches specified in the 'patches' feature.
7200                 # For single commits, we limit the output to a single patch,
7201                 # diverging from the git-format-patch default.
7202                 my @commit_spec = ();
7203                 if ($hash_parent) {
7204                         if ($patch_max > 0) {
7205                                 push @commit_spec, "-$patch_max";
7206                         }
7207                         push @commit_spec, '-n', "$hash_parent..$hash";
7208                 } else {
7209                         if ($params{-single}) {
7210                                 push @commit_spec, '-1';
7211                         } else {
7212                                 if ($patch_max > 0) {
7213                                         push @commit_spec, "-$patch_max";
7214                                 }
7215                                 push @commit_spec, "-n";
7216                         }
7217                         push @commit_spec, '--root', $hash;
7218                 }
7219                 open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
7220                         '--encoding=utf8', '--stdout', @commit_spec
7221                         or die_error(500, "Open git-format-patch failed");
7222         } else {
7223                 die_error(400, "Unknown commitdiff format");
7224         }
7225
7226         # non-textual hash id's can be cached
7227         my $expires;
7228         if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
7229                 $expires = "+1d";
7230         }
7231
7232         # write commit message
7233         if ($format eq 'html') {
7234                 my $refs = git_get_references();
7235                 my $ref = format_ref_marker($refs, $co{'id'});
7236
7237                 git_header_html(undef, $expires);
7238                 git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
7239                 git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
7240                 print "<div class=\"title_text\">\n" .
7241                       "<table class=\"object_header\">\n";
7242                 git_print_authorship_rows(\%co);
7243                 print "</table>".
7244                       "</div>\n";
7245                 print "<div class=\"page_body\">\n";
7246                 if (@{$co{'comment'}} > 1) {
7247                         print "<div class=\"log\">\n";
7248                         git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
7249                         print "</div>\n"; # class="log"
7250                 }
7251
7252         } elsif ($format eq 'plain') {
7253                 my $refs = git_get_references("tags");
7254                 my $tagname = git_get_rev_name_tags($hash);
7255                 my $filename = basename($project) . "-$hash.patch";
7256
7257                 print $cgi->header(
7258                         -type => 'text/plain',
7259                         -charset => 'utf-8',
7260                         -expires => $expires,
7261                         -content_disposition => 'inline; filename="' . "$filename" . '"');
7262                 my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
7263                 print "From: " . to_utf8($co{'author'}) . "\n";
7264                 print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
7265                 print "Subject: " . to_utf8($co{'title'}) . "\n";
7266
7267                 print "X-Git-Tag: $tagname\n" if $tagname;
7268                 print "X-Git-Url: " . $cgi->self_url() . "\n\n";
7269
7270                 foreach my $line (@{$co{'comment'}}) {
7271                         print to_utf8($line) . "\n";
7272                 }
7273                 print "---\n\n";
7274         } elsif ($format eq 'patch') {
7275                 my $filename = basename($project) . "-$hash.patch";
7276
7277                 print $cgi->header(
7278                         -type => 'text/plain',
7279                         -charset => 'utf-8',
7280                         -expires => $expires,
7281                         -content_disposition => 'inline; filename="' . "$filename" . '"');
7282         }
7283
7284         # write patch
7285         if ($format eq 'html') {
7286                 my $use_parents = !defined $hash_parent ||
7287                         $hash_parent eq '-c' || $hash_parent eq '--cc';
7288                 git_difftree_body(\@difftree, $hash,
7289                                   $use_parents ? @{$co{'parents'}} : $hash_parent);
7290                 print "<br/>\n";
7291
7292                 git_patchset_body($fd, \@difftree, $hash,
7293                                   $use_parents ? @{$co{'parents'}} : $hash_parent);
7294                 close $fd;
7295                 print "</div>\n"; # class="page_body"
7296                 git_footer_html();
7297
7298         } elsif ($format eq 'plain') {
7299                 local $/ = undef;
7300                 print <$fd>;
7301                 close $fd
7302                         or print "Reading git-diff-tree failed\n";
7303         } elsif ($format eq 'patch') {
7304                 local $/ = undef;
7305                 print <$fd>;
7306                 close $fd
7307                         or print "Reading git-format-patch failed\n";
7308         }
7309 }
7310
# 'commitdiff_plain' action: same as 'commitdiff', but asks
# git_commitdiff() for its plain-text output format.
sub git_commitdiff_plain {
        my @options = (-format => 'plain');
        return git_commitdiff(@options);
}
7314
# format-patch-style patches

# 'patch' action: requests the 'patch' output format from
# git_commitdiff() with the -single flag set.
sub git_patch {
        my @options = (
                -format => 'patch',
                -single => 1,
        );
        return git_commitdiff(@options);
}
7319
# 'patches' action: requests the 'patch' output format from
# git_commitdiff() without the -single flag.
sub git_patches {
        my @options = (-format => 'patch');
        return git_commitdiff(@options);
}
7323
# 'history' action: hands the request to git_log_generic(), using
# git_history_body() as the body printer and passing the globals
# $hash_base, $hash_parent_base, $file_name and $hash.
sub git_history {
        return git_log_generic(
                'history', \&git_history_body,
                $hash_base, $hash_parent_base, $file_name, $hash,
        );
}
7329
# 'search' action: validates the request and dispatches to the handler
# for the selected search type.
#
# Works on the globals $searchtype (defaults to 'commit'), $searchtext,
# $hash (defaults to the project's head) and $page (defaults to 0).
# Every failed check is reported through die_error().
sub git_search {
        $searchtype ||= 'commit';

        # check if appropriate features are enabled
        die_error(403, "Search is disabled")
                unless gitweb_check_feature('search');

        # These search types are guarded by a feature of the same name:
        # - pickaxe may take all resources of your box and run for several
        #   minutes with every query - so decide by yourself how public you
        #   make this feature
        # - grep search might be potentially CPU-intensive, too
        my %disabled_message = (
                'pickaxe' => "Pickaxe search is disabled",
                'grep'    => "Grep search is disabled",
        );
        if (exists $disabled_message{$searchtype} &&
            !gitweb_check_feature($searchtype)) {
                die_error(403, $disabled_message{$searchtype});
        }

        die_error(400, "Text field is empty")
                if !defined $searchtext;

        $hash = git_get_head_hash($project)
                if !defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                if !%co;

        $page = 0
                if !defined $page;

        # search type => routine producing the result page
        my %handler_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );
        my $handler = $handler_for{$searchtype};
        if (defined $handler) {
                $handler->(%co);
        } else {
                die_error(400, "Unknown search type");
        }
}
7374
# 'search_help' action: prints a static page describing the search types.
# The 'commit', 'author' and 'committer' entries are always shown; the
# 'grep' and 'pickaxe' entries appear only when the feature of the same
# name is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('', '', $hash, $hash, $hash);

        # introduction and the 'commit' search type
        print <<'HELP_INTRO';
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        # optional 'grep' search type
        if (gitweb_check_feature('grep')) {
                print <<'HELP_GREP';
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        # 'author' and 'committer' search types
        print <<'HELP_PEOPLE';
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        # optional 'pickaxe' search type
        if (gitweb_check_feature('pickaxe')) {
                print <<'HELP_PICKAXE';
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
7418
# 'shortlog' action: hands the request to git_log_generic(), using
# git_shortlog_body() as the body printer and passing the globals
# $hash and $hash_parent.
sub git_shortlog {
        return git_log_generic(
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
}
7423
7424 ## ......................................................................
7425 ## feeds (RSS, Atom; OPML)
7426
# Generate a web feed (RSS 2.0 or Atom) listing recent commits.
#
# Parameters:
#   $format - 'rss' or 'atom'; 'atom' is used when the argument is omitted
#             or false.  Any other value is rejected with die_error(400).
#
# Reads the globals $hash (start revision; 'HEAD' when unset) and
# $file_name (when set, it is passed on to parse_commits() and
# git-diff-tree as a path limiter).  Prints the HTTP header followed by
# the feed document.
#
# If the request carries If-Modified-Since and either HTTP::Date or
# Time::ParseDate can be loaded, a "304 Not Modified" header is sent when
# the newest commit is not more recent than that date.  For HEAD requests
# only the HTTP header is printed.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                # the key is 'committer_tz' (two t's), matching the other
                # committer_* keys read from the commit hash in this sub
                %latest_date   = parse_date($latest_epoch, $latest_commit{'committer_tz'});
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # date parsing is optional: use whichever module is installed
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title is built from configuration and request data and is
        # embedded as XML character data below, so it has to be escaped
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (!defined $descr) {
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        $descr = esc_html($descr);
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for my $i (0 .. $#commitlist) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files; a commit whose diff-tree cannot
                # be opened or read is left out of the feed
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        # print the escaped copy; do not overwrite the commit's
                        # own comment lines through the loop alias
                        print esc_html($line) . "\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
7682
# 'rss' action: produce the feed in RSS format via git_feed().
sub git_rss {
        my $format = 'rss';
        return git_feed($format);
}
7686
# 'atom' action: produce the feed in Atom format via git_feed().
sub git_atom {
        my $format = 'atom';
        return git_feed($format);
}
7690
# 'opml' action: print an OPML 1.0 document with one RSS outline entry
# per project returned by git_get_projects_list().
#
# Projects for which no head hash or no head commit can be obtained are
# left out.  Fails with die_error(404) when the project list is empty.
# Note that the global $git_dir is pointed at each project in turn while
# the list is generated.
sub git_opml {
        my @list = git_get_projects_list();
        if (!@list) {
                die_error(404, "No projects found");
        }

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        # the site name ends up as XML character data, so characters such
        # as '&' and '<' have to be escaped to keep the document well-formed
        my $title = esc_html($site_name);
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my $proj_path = $pr->{'path'};
                my $head = git_get_head_hash($proj_path);
                next if !defined $head;

                # parse_commit() is run with $git_dir set to this project
                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next if !%co;

                my $path = esc_html(chop_str($proj_path, 25, 5));
                my $rss  = href('project' => $proj_path, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj_path, 'action' => 'summary', -full => 1);
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}