Merge branch 'da/gitk-reload-tag-contents' into maint-1.7.11
[git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
21 binmode STDOUT, ':utf8';
22
23 our $t0 = [ gettimeofday() ];
24 our $number_of_git_cmds = 0;
25
26 BEGIN {
27         CGI->compile() if $ENV{'MOD_PERL'};
28 }
29
30 our $version = "++GIT_VERSION++";
31
32 our ($my_url, $my_uri, $base_url, $path_info, $home_link);
# Compute the URL-related globals ($my_url, $my_uri, $base_url, $path_info
# and $home_link) from the current CGI request held in $cgi.
sub evaluate_uri {
        our $cgi;

        our $my_url = $cgi->url();
        our $my_uri = $cgi->url(-absolute => 1);

        # $base_url is what relative URLs in gitweb ($logo, $favicon, ...)
        # are resolved against; it only matters when PATH_INFO is nonempty.
        our $base_url = $my_url;

        # If gitweb is served as DirectoryIndex, the request URL lacks the
        # script name and $cgi->url() does not strip PATH_INFO, so it is
        # stripped here by hand.  $path_info is global because it is used
        # again later on.
        #
        # In that setup $my_url is not the full script URL either.  That is
        # fine for generated links (they keep implying the script name when
        # the request did not spell it out), but it makes $my_url unusable as
        # base URL; hence whenever PATH_INFO had to be stripped the base URL
        # is rebuilt from scratch.
        our $path_info = decode_utf8($ENV{"PATH_INFO"});
        if ($path_info) {
                # The web server hands us PATH_INFO already URL-decoded while
                # $my_url and $my_uri are still encoded; decode both so that
                # the suffix comparison below can match.
                for my $encoded ($my_url, $my_uri) {
                        $encoded = unescape($encoded);
                }

                # $my_uri is only touched when $my_url was stripped first.
                my $stripped = $my_url =~ s,\Q$path_info\E$,,
                            && $my_uri =~ s,\Q$path_info\E$,,;
                if ($stripped && defined $ENV{'SCRIPT_NAME'}) {
                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
                }
        }

        # where the home link at the top of every page points to
        our $home_link = $my_uri || "/";
}
72
73 # core git executable to use
74 # this can just be "git" if your webserver has a sensible PATH
75 our $GIT = "++GIT_BINDIR++/git";
76
77 # absolute fs-path which will be prepended to the project path
78 #our $projectroot = "/pub/scm";
79 our $projectroot = "++GITWEB_PROJECTROOT++";
80
81 # fs traversing limit for getting project list
82 # the number is relative to the projectroot
83 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
84
85 # string of the home link on top of all pages
86 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
87
88 # name of your site or organization to appear in page titles
89 # replace this with something more descriptive for clearer bookmarks
90 our $site_name = "++GITWEB_SITENAME++"
91                  || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
92
93 # html snippet to include in the <head> section of each page
94 our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
95 # filename of html text to include at top of each page
96 our $site_header = "++GITWEB_SITE_HEADER++";
97 # html text to include at home page
98 our $home_text = "++GITWEB_HOMETEXT++";
99 # filename of html text to include at bottom of each page
100 our $site_footer = "++GITWEB_SITE_FOOTER++";
101
102 # URI of stylesheets
103 our @stylesheets = ("++GITWEB_CSS++");
104 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
105 our $stylesheet = undef;
106 # URI of GIT logo (72x27 size)
107 our $logo = "++GITWEB_LOGO++";
108 # URI of GIT favicon, assumed to be image/png type
109 our $favicon = "++GITWEB_FAVICON++";
110 # URI of gitweb.js (JavaScript code for gitweb)
111 our $javascript = "++GITWEB_JS++";
112
113 # URI and label (title) of GIT logo link
114 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
115 #our $logo_label = "git documentation";
116 our $logo_url = "http://git-scm.com/";
117 our $logo_label = "git homepage";
118
119 # source of projects list
120 our $projects_list = "++GITWEB_LIST++";
121
122 # the width (in characters) of the projects list "Description" column
123 our $projects_list_description_width = 25;
124
125 # group projects by category on the projects list
126 # (enabled if this variable evaluates to true)
127 our $projects_list_group_categories = 0;
128
129 # default category if none specified
130 # (leave the empty string for no category)
131 our $project_list_default_category = "";
132
133 # default order of projects list
134 # valid values are none, project, descr, owner, and age
135 our $default_projects_order = "project";
136
137 # show repository only if this file exists
138 # (only effective if this variable evaluates to true)
139 our $export_ok = "++GITWEB_EXPORT_OK++";
140
141 # don't generate age column on the projects list page
142 our $omit_age_column = 0;
143
144 # don't generate information about owners of repositories
145 our $omit_owner=0;
146
147 # show repository only if this subroutine returns true
148 # when given the path to the project, for example:
149 #    sub { return -e "$_[0]/git-daemon-export-ok"; }
150 our $export_auth_hook = undef;
151
152 # only allow viewing of repositories also shown on the overview page
153 our $strict_export = "++GITWEB_STRICT_EXPORT++";
154
155 # list of git base URLs used for URL to where fetch project from,
156 # i.e. full URL is "$git_base_url/$project"
157 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
158
159 # default blob_plain mimetype and default charset for text/plain blob
160 our $default_blob_plain_mimetype = 'text/plain';
161 our $default_text_plain_charset  = undef;
162
163 # file to use for guessing MIME types before trying /etc/mime.types
164 # (relative to the current git repository)
165 our $mimetypes_file = undef;
166
# assume this charset if line contains non-UTF-8 characters;
# it should be a valid encoding (see Encode::Supported(3pm) for the list)
# in which every byte sequence is valid, for example
# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
# could even be 'utf-8' for the old behavior)
172 our $fallback_encoding = 'latin1';
173
174 # rename detection options for git-diff and git-diff-tree
175 # - default is '-M', with the cost proportional to
176 #   (number of removed files) * (number of new files).
177 # - more costly is '-C' (which implies '-M'), with the cost proportional to
178 #   (number of changed files + number of removed files) * (number of new files)
179 # - even more costly is '-C', '--find-copies-harder' with cost
180 #   (number of files in the original tree) * (number of new files)
181 # - one might want to include '-B' option, e.g. '-B', '-M'
182 our @diff_opts = ('-M'); # taken from git_commit
183
184 # Disables features that would allow repository owners to inject script into
185 # the gitweb domain.
186 our $prevent_xss = 0;
187
188 # Path to the highlight executable to use (must be the one from
189 # http://www.andre-simon.de due to assumptions about parameters and output).
190 # Useful if highlight is not installed on your webserver's PATH.
191 # [Default: highlight]
192 our $highlight_bin = "++HIGHLIGHT_BIN++";
193
194 # information about snapshot formats that gitweb is capable of serving
195 our %known_snapshot_formats = (
196         # name => {
197         #       'display' => display name,
198         #       'type' => mime type,
199         #       'suffix' => filename suffix,
200         #       'format' => --format for git-archive,
201         #       'compressor' => [compressor command and arguments]
202         #                       (array reference, optional)
203         #       'disabled' => boolean (optional)}
204         #
205         'tgz' => {
206                 'display' => 'tar.gz',
207                 'type' => 'application/x-gzip',
208                 'suffix' => '.tar.gz',
209                 'format' => 'tar',
210                 'compressor' => ['gzip', '-n']},
211
212         'tbz2' => {
213                 'display' => 'tar.bz2',
214                 'type' => 'application/x-bzip2',
215                 'suffix' => '.tar.bz2',
216                 'format' => 'tar',
217                 'compressor' => ['bzip2']},
218
219         'txz' => {
220                 'display' => 'tar.xz',
221                 'type' => 'application/x-xz',
222                 'suffix' => '.tar.xz',
223                 'format' => 'tar',
224                 'compressor' => ['xz'],
225                 'disabled' => 1},
226
227         'zip' => {
228                 'display' => 'zip',
229                 'type' => 'application/x-zip',
230                 'suffix' => '.zip',
231                 'format' => 'zip'},
232 );
233
234 # Aliases so we understand old gitweb.snapshot values in repository
235 # configuration.
236 our %known_snapshot_format_aliases = (
237         'gzip'  => 'tgz',
238         'bzip2' => 'tbz2',
239         'xz'    => 'txz',
240
241         # backward compatibility: legacy gitweb config support
242         'x-gzip' => undef, 'gz' => undef,
243         'x-bzip2' => undef, 'bz2' => undef,
244         'x-zip' => undef, '' => undef,
245 );
246
247 # Pixel sizes for icons and avatars. If the default font sizes or lineheights
248 # are changed, it may be appropriate to change these values too via
249 # $GITWEB_CONFIG.
250 our %avatar_size = (
251         'default' => 16,
252         'double'  => 32
253 );
254
255 # Used to set the maximum load that we will still respond to gitweb queries.
# If server load exceeds this value then return "503 server busy" error.
# If gitweb cannot determine server load, it is taken to be 0.
258 # Leave it undefined (or set to 'undef') to turn off load checking.
259 our $maxload = 300;
260
261 # configuration for 'highlight' (http://www.andre-simon.de/)
262 # match by basename
263 our %highlight_basename = (
264         #'Program' => 'py',
265         #'Library' => 'py',
266         'SConstruct' => 'py', # SCons equivalent of Makefile
267         'Makefile' => 'make',
268 );
269 # match by extension
270 our %highlight_ext = (
271         # main extensions, defining name of syntax;
272         # see files in /usr/share/highlight/langDefs/ directory
273         map { $_ => $_ }
274                 qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
275         # alternate extensions, see /etc/highlight/filetypes.conf
276         'h' => 'c',
277         map { $_ => 'sh'  } qw(bash zsh ksh),
278         map { $_ => 'cpp' } qw(cxx c++ cc),
279         map { $_ => 'php' } qw(php3 php4 php5 phps),
280         map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
281         map { $_ => 'make'} qw(mak mk),
282         map { $_ => 'xml' } qw(xhtml html htm),
283 );
284
285 # You define site-wide feature defaults here; override them with
286 # $GITWEB_CONFIG as necessary.
287 our %feature = (
288         # feature => {
289         #       'sub' => feature-sub (subroutine),
290         #       'override' => allow-override (boolean),
291         #       'default' => [ default options...] (array reference)}
292         #
293         # if feature is overridable (it means that allow-override has true value),
294         # then feature-sub will be called with default options as parameters;
295         # return value of feature-sub indicates if to enable specified feature
296         #
297         # if there is no 'sub' key (no feature-sub), then feature cannot be
298         # overridden
299         #
300         # use gitweb_get_feature(<feature>) to retrieve the <feature> value
301         # (an array) or gitweb_check_feature(<feature>) to check if <feature>
302         # is enabled
303
304         # Enable the 'blame' blob view, showing the last commit that modified
305         # each line in the file. This can be very CPU-intensive.
306
307         # To enable system wide have in $GITWEB_CONFIG
308         # $feature{'blame'}{'default'} = [1];
309         # To have project specific config enable override in $GITWEB_CONFIG
310         # $feature{'blame'}{'override'} = 1;
311         # and in project config gitweb.blame = 0|1;
312         'blame' => {
313                 'sub' => sub { feature_bool('blame', @_) },
314                 'override' => 0,
315                 'default' => [0]},
316
317         # Enable the 'snapshot' link, providing a compressed archive of any
318         # tree. This can potentially generate high traffic if you have large
319         # project.
320
321         # Value is a list of formats defined in %known_snapshot_formats that
322         # you wish to offer.
323         # To disable system wide have in $GITWEB_CONFIG
324         # $feature{'snapshot'}{'default'} = [];
325         # To have project specific config enable override in $GITWEB_CONFIG
326         # $feature{'snapshot'}{'override'} = 1;
327         # and in project config, a comma-separated list of formats or "none"
328         # to disable.  Example: gitweb.snapshot = tbz2,zip;
329         'snapshot' => {
330                 'sub' => \&feature_snapshot,
331                 'override' => 0,
332                 'default' => ['tgz']},
333
334         # Enable text search, which will list the commits which match author,
335         # committer or commit text to a given string.  Enabled by default.
336         # Project specific override is not supported.
337         #
338         # Note that this controls all search features, which means that if
339         # it is disabled, then 'grep' and 'pickaxe' search would also be
340         # disabled.
341         'search' => {
342                 'override' => 0,
343                 'default' => [1]},
344
345         # Enable grep search, which will list the files in currently selected
346         # tree containing the given string. Enabled by default. This can be
347         # potentially CPU-intensive, of course.
348         # Note that you need to have 'search' feature enabled too.
349
350         # To enable system wide have in $GITWEB_CONFIG
351         # $feature{'grep'}{'default'} = [1];
352         # To have project specific config enable override in $GITWEB_CONFIG
353         # $feature{'grep'}{'override'} = 1;
354         # and in project config gitweb.grep = 0|1;
355         'grep' => {
356                 'sub' => sub { feature_bool('grep', @_) },
357                 'override' => 0,
358                 'default' => [1]},
359
360         # Enable the pickaxe search, which will list the commits that modified
361         # a given string in a file. This can be practical and quite faster
362         # alternative to 'blame', but still potentially CPU-intensive.
363         # Note that you need to have 'search' feature enabled too.
364
365         # To enable system wide have in $GITWEB_CONFIG
366         # $feature{'pickaxe'}{'default'} = [1];
367         # To have project specific config enable override in $GITWEB_CONFIG
368         # $feature{'pickaxe'}{'override'} = 1;
369         # and in project config gitweb.pickaxe = 0|1;
370         'pickaxe' => {
371                 'sub' => sub { feature_bool('pickaxe', @_) },
372                 'override' => 0,
373                 'default' => [1]},
374
375         # Enable showing size of blobs in a 'tree' view, in a separate
        # column, similar to what 'ls -l' does.  This costs a bit of IO.
377
378         # To disable system wide have in $GITWEB_CONFIG
379         # $feature{'show-sizes'}{'default'} = [0];
380         # To have project specific config enable override in $GITWEB_CONFIG
381         # $feature{'show-sizes'}{'override'} = 1;
382         # and in project config gitweb.showsizes = 0|1;
383         'show-sizes' => {
384                 'sub' => sub { feature_bool('showsizes', @_) },
385                 'override' => 0,
386                 'default' => [1]},
387
388         # Make gitweb use an alternative format of the URLs which can be
389         # more readable and natural-looking: project name is embedded
390         # directly in the path and the query string contains other
391         # auxiliary information. All gitweb installations recognize
392         # URL in either format; this configures in which formats gitweb
393         # generates links.
394
395         # To enable system wide have in $GITWEB_CONFIG
396         # $feature{'pathinfo'}{'default'} = [1];
397         # Project specific override is not supported.
398
399         # Note that you will need to change the default location of CSS,
400         # favicon, logo and possibly other files to an absolute URL. Also,
401         # if gitweb.cgi serves as your indexfile, you will need to force
402         # $my_uri to contain the script name in your $GITWEB_CONFIG.
403         'pathinfo' => {
404                 'override' => 0,
405                 'default' => [0]},
406
407         # Make gitweb consider projects in project root subdirectories
408         # to be forks of existing projects. Given project $projname.git,
409         # projects matching $projname/*.git will not be shown in the main
410         # projects list, instead a '+' mark will be added to $projname
411         # there and a 'forks' view will be enabled for the project, listing
412         # all the forks. If project list is taken from a file, forks have
413         # to be listed after the main project.
414
415         # To enable system wide have in $GITWEB_CONFIG
416         # $feature{'forks'}{'default'} = [1];
417         # Project specific override is not supported.
418         'forks' => {
419                 'override' => 0,
420                 'default' => [0]},
421
422         # Insert custom links to the action bar of all project pages.
423         # This enables you mainly to link to third-party scripts integrating
424         # into gitweb; e.g. git-browser for graphical history representation
425         # or custom web-based repository administration interface.
426
427         # The 'default' value consists of a list of triplets in the form
428         # (label, link, position) where position is the label after which
429         # to insert the link and link is a format string where %n expands
430         # to the project name, %f to the project path within the filesystem,
431         # %h to the current hash (h gitweb parameter) and %b to the current
432         # hash base (hb gitweb parameter); %% expands to %.
433
434         # To enable system wide have in $GITWEB_CONFIG e.g.
435         # $feature{'actions'}{'default'} = [('graphiclog',
436         #       '/git-browser/by-commit.html?r=%n', 'summary')];
437         # Project specific override is not supported.
438         'actions' => {
439                 'override' => 0,
440                 'default' => []},
441
        # Allow gitweb to scan project content tags of project repository,
443         # and display the popular Web 2.0-ish "tag cloud" near the projects
444         # list.  Note that this is something COMPLETELY different from the
445         # normal Git tags.
446
447         # gitweb by itself can show existing tags, but it does not handle
448         # tagging itself; you need to do it externally, outside gitweb.
449         # The format is described in git_get_project_ctags() subroutine.
450         # You may want to install the HTML::TagCloud Perl module to get
451         # a pretty tag cloud instead of just a list of tags.
452
453         # To enable system wide have in $GITWEB_CONFIG
454         # $feature{'ctags'}{'default'} = [1];
455         # Project specific override is not supported.
456
457         # In the future whether ctags editing is enabled might depend
458         # on the value, but using 1 should always mean no editing of ctags.
459         'ctags' => {
460                 'override' => 0,
461                 'default' => [0]},
462
463         # The maximum number of patches in a patchset generated in patch
464         # view. Set this to 0 or undef to disable patch view, or to a
465         # negative number to remove any limit.
466
467         # To disable system wide have in $GITWEB_CONFIG
468         # $feature{'patches'}{'default'} = [0];
469         # To have project specific config enable override in $GITWEB_CONFIG
470         # $feature{'patches'}{'override'} = 1;
471         # and in project config gitweb.patches = 0|n;
472         # where n is the maximum number of patches allowed in a patchset.
473         'patches' => {
474                 'sub' => \&feature_patches,
475                 'override' => 0,
476                 'default' => [16]},
477
478         # Avatar support. When this feature is enabled, views such as
479         # shortlog or commit will display an avatar associated with
480         # the email of the committer(s) and/or author(s).
481
482         # Currently available providers are gravatar and picon.
483         # If an unknown provider is specified, the feature is disabled.
484
485         # Gravatar depends on Digest::MD5.
486         # Picon currently relies on the indiana.edu database.
487
488         # To enable system wide have in $GITWEB_CONFIG
489         # $feature{'avatar'}{'default'} = ['<provider>'];
490         # where <provider> is either gravatar or picon.
491         # To have project specific config enable override in $GITWEB_CONFIG
492         # $feature{'avatar'}{'override'} = 1;
493         # and in project config gitweb.avatar = <provider>;
494         'avatar' => {
495                 'sub' => \&feature_avatar,
496                 'override' => 0,
497                 'default' => ['']},
498
499         # Enable displaying how much time and how many git commands
500         # it took to generate and display page.  Disabled by default.
501         # Project specific override is not supported.
502         'timed' => {
503                 'override' => 0,
504                 'default' => [0]},
505
506         # Enable turning some links into links to actions which require
507         # JavaScript to run (like 'blame_incremental').  Not enabled by
508         # default.  Project specific override is currently not supported.
509         'javascript-actions' => {
510                 'override' => 0,
511                 'default' => [0]},
512
513         # Enable and configure ability to change common timezone for dates
514         # in gitweb output via JavaScript.  Enabled by default.
515         # Project specific override is not supported.
516         'javascript-timezone' => {
517                 'override' => 0,
518                 'default' => [
519                         'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
520                                      # or undef to turn off this feature
521                         'gitweb_tz', # name of cookie where to store selected timezone
522                         'datetime',  # CSS class used to mark up dates for manipulation
523                 ]},
524
525         # Syntax highlighting support. This is based on Daniel Svensson's
526         # and Sham Chukoury's work in gitweb-xmms2.git.
527         # It requires the 'highlight' program present in $PATH,
528         # and therefore is disabled by default.
529
530         # To enable system wide have in $GITWEB_CONFIG
531         # $feature{'highlight'}{'default'} = [1];
532
533         'highlight' => {
534                 'sub' => sub { feature_bool('highlight', @_) },
535                 'override' => 0,
536                 'default' => [0]},
537
538         # Enable displaying of remote heads in the heads list
539
540         # To enable system wide have in $GITWEB_CONFIG
541         # $feature{'remote_heads'}{'default'} = [1];
542         # To have project specific config enable override in $GITWEB_CONFIG
543         # $feature{'remote_heads'}{'override'} = 1;
544         # and in project config gitweb.remote_heads = 0|1;
545         'remote_heads' => {
546                 'sub' => sub { feature_bool('remote_heads', @_) },
547                 'override' => 0,
548                 'default' => [0]},
549 );
550
# Return the list of values configured for feature $name.
#
# Unknown features yield an empty list.  The site-wide 'default' list from
# %feature is returned unless the feature is marked overridable and a
# repository ($git_dir) is selected, in which case the feature's 'sub' is
# called with the defaults and its result is returned instead.
sub gitweb_get_feature {
        my ($name) = @_;
        return unless exists $feature{$name};

        my $spec     = $feature{$name};
        my @defaults = @{$spec->{'default'}};

        # a per-project override needs a project to read the config from
        our $git_dir; # global variable, declared later
        return @defaults
                unless $spec->{'override'} && defined $git_dir;

        my $override_sub = $spec->{'sub'};
        unless (defined $override_sub) {
                warn "feature $name is not overridable";
                return @defaults;
        }

        return $override_sub->(@defaults);
}
569
# Convenience wrapper returning only the first value of a feature, which
# for boolean features tells whether the feature is enabled.  It lets you
# write
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# where you would otherwise need
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
        my @feature_values = gitweb_get_feature(@_);
        # list slice on purpose: an empty value list stays an empty list
        return (@feature_values)[0];
}
584
585
# Feature-sub for boolean features that a project may override.
#
# Parameters: the project config key to look up, followed by the site-wide
# default value(s) of the feature.
# Returns a one-element list: 1 or 0 when the project config holds 'true'
# or 'false', otherwise the first site-wide default.
sub feature_bool {
        my $key = shift;
        my ($val) = git_get_project_config($key, '--bool');

        if (defined $val) {
                return (1) if $val eq 'true';
                return (0) if $val eq 'false';
        }

        # Nothing configured for this project, or a value that is not a
        # recognizable boolean: keep the site-wide default rather than
        # falling off the end of the sub with an incidental return value.
        return ($_[0]);
}
598
# Feature-sub for 'snapshot': returns the list of snapshot formats to offer.
# The site-wide defaults passed in are used unless the project config has a
# true 'snapshot' value; that value is either "none" (offer nothing) or a
# list of formats separated by commas and/or whitespace.
sub feature_snapshot {
        my @site_formats = @_;

        my ($configured) = git_get_project_config('snapshot');
        return @site_formats unless $configured;

        my @project_formats;
        if ($configured ne 'none') {
                @project_formats = split /\s*[,\s]\s*/, $configured;
        }
        return @project_formats;
}
610
# Feature-sub for 'patches': returns whatever the project config lookup of
# 'patches' (as an integer) yields, or the first site-wide default when the
# lookup yields nothing.
sub feature_patches {
        my ($site_default) = @_;

        my @configured = (git_get_project_config('patches', '--int'));

        return @configured ? @configured : ($site_default);
}
620
# Feature-sub for 'avatar': returns the project config lookup of 'avatar'
# when it yields anything, and the site-wide defaults passed in otherwise.
sub feature_avatar {
        my @configured = (git_get_project_config('avatar'));

        return @configured if @configured;
        return @_;
}
626
# Tell whether directory $dir has a usable HEAD.
#
# A plain -e test is not enough: a repository initialized long ago may have
# HEAD as a symlink, and after pack-refs and pruning that symlink dangles.
# Such a HEAD is still accepted when it points somewhere below refs/heads/.
sub check_head_link {
        my ($dir) = @_;
        my $head_path = "$dir/HEAD";

        return 1 if -e $head_path;

        # HEAD missing or dangling: only a symlink into refs/heads/ will do
        return (-l $head_path && readlink($head_path) =~ /^refs\/heads\//);
}
636
# Decide whether the repository in $dir may be shown.  All of the following
# must hold, and they are checked in this order:
#  - the directory has a usable HEAD (check_head_link);
#  - if $export_ok is set, the file of that name exists inside $dir;
#  - if $export_auth_hook is set, it returns true when called with $dir.
sub check_export_ok {
        my ($dir) = @_;

        my $has_head = check_head_link($dir);
        return $has_head unless $has_head;

        if ($export_ok) {
                my $marker_exists = -e "$dir/$export_ok";
                return $marker_exists unless $marker_exists;
        }

        return 1 unless $export_auth_hook;
        return $export_auth_hook->($dir);
}
643
# Normalize a list of snapshot format names: names found in
# %known_snapshot_format_aliases are replaced by what the alias maps to
# (backward compatibility), then everything that is not a known, enabled
# entry of %known_snapshot_formats is dropped.
sub filter_snapshot_fmts {
        my @resolved;
        for my $fmt (@_) {
                push @resolved,
                        exists $known_snapshot_format_aliases{$fmt}
                                ? $known_snapshot_format_aliases{$fmt}
                                : $fmt;
        }

        return grep {
                exists $known_snapshot_formats{$_} &&
                !$known_snapshot_formats{$_}{'disabled'}
        } @resolved;
}
656
# If it is set to a code reference, that code is run once per request,
# allowing configuration that changes with each request to be updated,
# while the rest of the config file is still run only once.
660 #
661 # Otherwise, if it is false then gitweb would process config file only once;
662 # if it is true then gitweb config would be run for each request.
663 our $per_request_config = 1;
664
# Read and evaluate the gitweb config file named by the only parameter.
#
# Returns true when the file was loaded, and false (empty list / undef) when
# no filename was given or the file does not exist; that allows chaining
# calls so that the first existing file wins.
# Dies when the file exists but cannot be read, or when evaluating it
# fails, as neither situation is recoverable.
sub read_config_file {
        my $filename = shift;
        return unless defined $filename;
        return unless -e $filename;

        # An existing but unreadable config must not be skipped silently:
        # the site would run with settings its administrator did not intend.
        -r $filename
                or die "Cannot read gitweb config file '$filename': $!\n";

        # "do FILE" looks a name up in @INC unless it is absolute or starts
        # with ./ or ../, whereas the tests above are relative to the current
        # directory.  Anchor relative names so the very same file is loaded
        # (and is found at all when "." is not in @INC).
        require File::Spec;
        my $path = $filename;
        unless (File::Spec->file_name_is_absolute($path) || $path =~ m{^\.\.?/}) {
                $path = "./$path";
        }

        do $path;
        # die if there are errors parsing config file
        die $@ if $@;
        return 1;
}
680
681 our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
# Locate and load the gitweb configuration files.
#
# Each of the three file names comes from the environment variable of the
# same name, falling back to the build-time value.  The common file is read
# first; then the per-instance file is read, and only if that one was not
# loaded the system-wide file is read.
sub evaluate_gitweb_config {
        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";

        # Guard against reading the same file twice: blank out any name that
        # duplicates the common config.  $GITWEB_CONFIG and
        # $GITWEB_CONFIG_SYSTEM may equal each other, because only one of
        # the two ever gets used.
        for my $config_name ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM) {
                $config_name = "" if ($config_name eq $GITWEB_CONFIG_COMMON);
        }

        # Common system-wide settings come first, so that GITWEB_CONFIG or
        # GITWEB_CONFIG_SYSTEM can override them.
        read_config_file($GITWEB_CONFIG_COMMON);

        # Use the first config file that exists: the per-instance
        # GITWEB_CONFIG if present, GITWEB_CONFIG_SYSTEM otherwise.
        return if read_config_file($GITWEB_CONFIG);
        read_config_file($GITWEB_CONFIG_SYSTEM);
}
702
# Return the system load average, for comparison against $maxload.
# The only source consulted is '/proc/loadavg'; when that file is missing
# or cannot be opened the result is 0, which means no load checking.
sub get_loadavg {
        my $loadavg_file = '/proc/loadavg';

        # support for systems that do not provide /proc/loadavg would have
        # to be added here
        return 0 unless -e $loadavg_file;

        open my $fh, '<', $loadavg_file
                or return 0;
        my $first_line = <$fh>;
        close $fh;

        # Columns one to three are the load averages over the last one, five
        # and 15 minutes; the fourth is running/total processes in m/n form
        # and the last one is the most recently used process ID.  Only the
        # one-minute figure is of interest.
        my ($one_minute) = split(/\s+/, $first_line);
        return $one_minute || 0;
}
724
725 # version of the core git binary
726 our $git_version;
# Run "$GIT --version" and store the reported version in $git_version
# ("unknown" when the output does not look like a version line); the call
# is counted in $number_of_git_cmds.
sub evaluate_git_version {
        our $git_version;

        my $version_output = qx("$GIT" --version);
        if ($version_output =~ m/git version (.*)$/) {
                $git_version = $1;
        } else {
                $git_version = "unknown";
        }
        $number_of_git_cmds++;
}
731
# Refuse the request with a 503 error when the load reported by
# get_loadavg() is above $maxload.  Nothing is checked when $maxload is
# undefined.
sub check_loadavg {
        return unless defined $maxload;

        die_error(503, "The load average on the server is too high")
                if get_loadavg() > $maxload;
}
737
738 # ======================================================================
739 # input validation and dispatch
740
# Request parameters may arrive through more than one channel (currently
# the CGI query string and PATH_INFO).  %input_params gathers them in one
# place while they are being evaluated, so that later consumers (e.g.
# href()) do not have to care where a given parameter came from.

our %input_params = ();
747
# Keys of %input_params are the long parameter names.  href() needs to turn
# those into their short CGI equivalents, and since that is by far the most
# frequent use, the table is stored as "long name => CGI key" rather than
# the other way round.  The array keeps the declaration order; the hash
# built from it is used for lookups.
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.

our @cgi_param_mapping = (
        project           => 'p',
        action            => 'a',
        file_name         => 'f',
        file_parent       => 'fp',
        hash              => 'h',
        hash_parent       => 'hp',
        hash_base         => 'hb',
        hash_parent_base  => 'hpb',
        page              => 'pg',
        order             => 'o',
        searchtext        => 's',
        searchtype        => 'st',
        snapshot_format   => 'sf',
        extra_options     => 'opt',
        search_use_regexp => 'sr',
        ctag              => 'by_tag',
        diff_style        => 'ds',
        project_filter    => 'pf',
        # this must be last entry (for manipulation from JavaScript)
        javascript        => 'js'
);
our %cgi_param_mapping = @cgi_param_mapping;
779
# table of known actions: action name => handler subroutine.
# It is used both to validate the requested action and to call its handler.
our %actions = (
        blame             => \&git_blame,
        blame_incremental => \&git_blame_incremental,
        blame_data        => \&git_blame_data,
        blobdiff          => \&git_blobdiff,
        blobdiff_plain    => \&git_blobdiff_plain,
        blob              => \&git_blob,
        blob_plain        => \&git_blob_plain,
        commitdiff        => \&git_commitdiff,
        commitdiff_plain  => \&git_commitdiff_plain,
        commit            => \&git_commit,
        forks             => \&git_forks,
        heads             => \&git_heads,
        history           => \&git_history,
        log               => \&git_log,
        patch             => \&git_patch,
        patches           => \&git_patches,
        remotes           => \&git_remotes,
        rss               => \&git_rss,
        atom              => \&git_atom,
        search            => \&git_search,
        search_help       => \&git_search_help,
        shortlog          => \&git_shortlog,
        summary           => \&git_summary,
        tag               => \&git_tag,
        tags              => \&git_tags,
        tree              => \&git_tree,
        snapshot          => \&git_snapshot,
        object            => \&git_object,
        # those below don't need $project
        opml              => \&git_opml,
        project_list      => \&git_project_list,
        project_index     => \&git_project_index,
);
815
# extra_options that may be passed on to commands: each permitted option
# maps to the list of actions that accept it
our %allowed_options = (
        '--no-merges' => [ 'rss', 'atom', 'log', 'shortlog', 'history' ],
);
821
# Populate %input_params from the CGI query parameters, decoding each value
# from UTF-8.  Every parameter is stored as a single value, with the sole
# exception of 'opt', which may be given several times and is therefore
# stored as an array reference.  Should more multi-valued parameters appear,
# a list of them would be the better approach; for now the one is singled out.
sub evaluate_query_params {
        our $cgi;

        for my $name (keys %cgi_param_mapping) {
                my $symbol = $cgi_param_mapping{$name};
                $input_params{$name} = $symbol eq 'opt'
                        ? [ map { decode_utf8($_) } $cgi->param($symbol) ]
                        : decode_utf8($cgi->param($symbol));
        }
}
837
# now read PATH_INFO and update the parameter list for missing parameters
#
# PATH_INFO is understood as
#   $project[/$action][/[$parentref[:$parentpath]..]$ref[:$path]]
# Nothing is done when the project was already given in the query string or
# when PATH_INFO is empty.  Values already present in %input_params are
# never overridden; once the project has been found, the remainder of
# PATH_INFO is ignored if an action was given in the query string.
sub evaluate_path_info {
        return if defined $input_params{'project'};
        return if !$path_info;
        $path_info =~ s,^/+,,;
        return if !$path_info;

        # find which part of PATH_INFO is project: drop trailing path
        # components until what is left passes check_head_link()
        my $project = $path_info;
        $project =~ s,/+$,,;
        while ($project && !check_head_link("$projectroot/$project")) {
                $project =~ s,/*[^/]*$,,;
        }
        return unless $project;
        $input_params{'project'} = $project;

        # do not change any parameters if an action is given using the query string
        return if $input_params{'action'};
        $path_info =~ s,^\Q$project\E/*,,;

        # next, check if we have an action
        my $action = $path_info;
        $action =~ s,/.*$,,;
        if (exists $actions{$action}) {
                # quote the name: it is data, not a pattern
                $path_info =~ s,^\Q$action\E/*,,;
                $input_params{'action'} = $action;
        }

        # list of actions that want hash_base instead of hash, but can have no
        # pathname (f) parameter
        my @wants_base = (
                'tree',
                'history',
        );

        # we want to catch, among others
        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
        my ($parentrefname, $parentpathname, $refname, $pathname) =
                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

        # first, analyze the 'current' part
        if (defined $pathname) {
                # we got "branch:filename" or "branch:dir/"
                # we could use git_get_type(branch:pathname), but:
                # - it needs $git_dir
                # - it does a git() call
                # - the convention of terminating directories with a slash
                #   makes it superfluous
                # - embedding the action in the PATH_INFO would make it even
                #   more superfluous
                $pathname =~ s,^/+,,;
                if (!$pathname || substr($pathname, -1) eq "/") {
                        $input_params{'action'} ||= "tree";
                        $pathname =~ s,/$,,;
                } else {
                        # the default action depends on whether we had parent info
                        # or not
                        if ($parentrefname) {
                                $input_params{'action'} ||= "blobdiff_plain";
                        } else {
                                $input_params{'action'} ||= "blob_plain";
                        }
                }
                $input_params{'hash_base'} ||= $refname;
                $input_params{'file_name'} ||= $pathname;
        } elsif (defined $refname) {
                # we got "branch". In this case we have to choose if we have to
                # set hash or hash_base.
                #
                # Most of the actions without a pathname only want hash to be
                # set, except for the ones specified in @wants_base that want
                # hash_base instead. It should also be noted that hand-crafted
                # links having 'history' as an action and no pathname or hash
                # set will fail, but that happens regardless of PATH_INFO.
                if (defined $parentrefname) {
                        # if there is parent let the default be 'shortlog' action
                        # (for http://git.example.com/repo.git/A..B links); if there
                        # is no parent, dispatch will detect type of object and set
                        # action appropriately if required (if action is not set)
                        $input_params{'action'} ||= "shortlog";
                }
                if ($input_params{'action'} &&
                    grep { $_ eq $input_params{'action'} } @wants_base) {
                        $input_params{'hash_base'} ||= $refname;
                } else {
                        $input_params{'hash'} ||= $refname;
                }
        }

        # next, handle the 'parent' part, if present
        if (defined $parentrefname) {
                # a missing pathspec defaults to the 'current' filename, allowing e.g.
                # someproject/blobdiff/oldrev..newrev:/filename
                if ($parentpathname) {
                        $parentpathname =~ s,^/+,,;
                        $parentpathname =~ s,/$,,;
                        $input_params{'file_parent'} ||= $parentpathname;
                } else {
                        $input_params{'file_parent'} ||= $input_params{'file_name'};
                }
                # we assume that hash_parent_base is wanted if a path was specified,
                # or if the action wants hash_base instead of hash; the action
                # may still be unset here (e.g. for "A.."), so guard the comparison
                if (defined $input_params{'file_parent'} ||
                        grep { defined $input_params{'action'} &&
                               $_ eq $input_params{'action'} } @wants_base) {
                        $input_params{'hash_parent_base'} ||= $parentrefname;
                } else {
                        $input_params{'hash_parent'} ||= $parentrefname;
                }
        }

        # for the snapshot action, we allow URLs in the form
        # $project/snapshot/$hash.ext
        # where .ext determines the snapshot and gets removed from the
        # passed $refname to provide the $hash.
        #
        # To be able to tell that $refname includes the format extension, we
        # require the following two conditions to be satisfied:
        # - the hash input parameter MUST have been set from the $refname part
        #   of the URL (i.e. they must be equal)
        # - the snapshot format MUST NOT have been defined already (e.g. from
        #   CGI parameter sf)
        # It's also useless to try any matching unless $refname has a dot,
        # so we check for that too
        if (defined $input_params{'action'} &&
                $input_params{'action'} eq 'snapshot' &&
                defined $refname && index($refname, '.') != -1 &&
                $refname eq $input_params{'hash'} &&
                !defined $input_params{'snapshot_format'}) {
                # We loop over the known snapshot formats, checking for
                # extensions. Allowed extensions are both the defined suffix
                # (which includes the initial dot already) and the snapshot
                # format key itself, with a prepended dot.
                #
                # Iterate over keys() rather than each(): the loop is left
                # early, and an each() iterator abandoned half-way would make
                # the next request served by the same process resume in the
                # middle of the hash and miss formats.
                foreach my $fmt (sort keys %known_snapshot_formats) {
                        my $opt = $known_snapshot_formats{$fmt};
                        my $hash = $refname;
                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
                                next;
                        }
                        my $sfx = $1;
                        # a valid suffix was found, so set the snapshot format
                        # and reset the hash parameter
                        $input_params{'snapshot_format'} = $fmt;
                        $input_params{'hash'} = $hash;
                        # we also set the format suffix to the one requested
                        # in the URL: this way a request for e.g. .tgz returns
                        # a .tgz instead of a .tar.gz
                        # NOTE(review): this rewrites the shared table itself, so
                        # in a long-running process later requests would no longer
                        # match the original suffix here -- confirm whether that
                        # is intended.
                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
                        last;
                }
        }
}
988
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp, $project_filter);
# Copy the collected %input_params into the per-request globals declared
# above, validating each one on the way.  An invalid value ends the request
# through die_error() (400, 403 or 404 depending on the parameter).
# $search_regexp is derived from $searchtext: the text itself when regexp
# search was requested, its quotemeta'ed form otherwise.
sub evaluate_and_validate_params {
        our $action = $input_params{'action'};
        if (defined $action && !validate_action($action)) {
                die_error(400, "Invalid action parameter");
        }

        # parameters which are pathnames
        our $project = $input_params{'project'};
        if (defined $project && !validate_project($project)) {
                # forget the rejected name before the error is reported
                undef $project;
                die_error(404, "No such project");
        }

        our $project_filter = $input_params{'project_filter'};
        if (defined $project_filter && !validate_pathname($project_filter)) {
                die_error(404, "Invalid project_filter parameter");
        }

        our $file_name = $input_params{'file_name'};
        if (defined $file_name && !validate_pathname($file_name)) {
                die_error(400, "Invalid file parameter");
        }

        our $file_parent = $input_params{'file_parent'};
        if (defined $file_parent && !validate_pathname($file_parent)) {
                die_error(400, "Invalid file parent parameter");
        }

        # parameters which are refnames
        our $hash = $input_params{'hash'};
        if (defined $hash && !validate_refname($hash)) {
                die_error(400, "Invalid hash parameter");
        }

        our $hash_parent = $input_params{'hash_parent'};
        if (defined $hash_parent && !validate_refname($hash_parent)) {
                die_error(400, "Invalid hash parent parameter");
        }

        our $hash_base = $input_params{'hash_base'};
        if (defined $hash_base && !validate_refname($hash_base)) {
                die_error(400, "Invalid hash base parameter");
        }

        our @extra_options = @{$input_params{'extra_options'}};
        # @extra_options is always defined, since it can only be (currently) set from
        # CGI, and $cgi->param() returns the empty array in array context if the param
        # is not set
        foreach my $opt (@extra_options) {
                if (not exists $allowed_options{$opt}) {
                        die_error(400, "Invalid option parameter");
                }
                # plain string comparison: the action name is data, not a
                # pattern, and it may be missing altogether
                unless (grep { defined $action && $_ eq $action }
                             @{$allowed_options{$opt}}) {
                        die_error(400, "Invalid option parameter for this action");
                }
        }

        our $hash_parent_base = $input_params{'hash_parent_base'};
        if (defined $hash_parent_base && !validate_refname($hash_parent_base)) {
                die_error(400, "Invalid hash parent base parameter");
        }

        # other parameters
        our $page = $input_params{'page'};
        if (defined $page && $page =~ m/[^0-9]/) {
                die_error(400, "Invalid page parameter");
        }

        our $searchtype = $input_params{'searchtype'};
        if (defined $searchtype && $searchtype =~ m/[^a-z]/) {
                die_error(400, "Invalid searchtype parameter");
        }

        our $search_use_regexp = $input_params{'search_use_regexp'};

        our $searchtext = $input_params{'searchtext'};
        our $search_regexp;
        if (defined $searchtext) {
                if (length($searchtext) < 2) {
                        die_error(403, "At least two characters are required for search parameter");
                }
                if ($search_use_regexp) {
                        $search_regexp = $searchtext;
                        # compile once to find out whether the pattern is valid
                        if (!eval { qr/$search_regexp/; 1; }) {
                                # strip the " at FILE line N" location from the message
                                (my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
                                die_error(400, "Invalid search regexp '$search_regexp'",
                                          esc_html($error));
                        }
                } else {
                        $search_regexp = quotemeta $searchtext;
                }
        }
}
1107
# path to the current git repository; set from $projectroot and $project,
# and left untouched when no project is selected
our $git_dir;
sub evaluate_git_dir {
        our $git_dir;
        if ($project) {
                $git_dir = "$projectroot/$project";
        }
}
1113
our (@snapshot_fmts, $git_avatar);
# Work out the feature-dependent globals:
# - @snapshot_fmts: the configured snapshot formats, run through
#   filter_snapshot_fmts()
# - $git_avatar: the avatar provider name, or the empty string when the
#   configured name is unknown or the provider's dependencies are missing
sub configure_gitweb_features {
        our @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        our ($git_avatar) = gitweb_get_feature('avatar');
        # 'picon' has no dependencies; 'gravatar' needs Digest::MD5
        my $provider_usable =
                $git_avatar eq 'gravatar' ? eval { require Digest::MD5; 1; }
              : $git_avatar eq 'picon'    ? 1
              :                             0;
        $git_avatar = '' unless $provider_usable;
}
1133
# custom error handler: 'die <message>' is Internal Server Error
sub handle_errors_html {
        my ($escaped_msg) = @_; # arrives already HTML escaped

        # Replace this handler with a plain message first: should die_error
        # itself fail, the failure must not be routed back here in a loop.
        set_message("Error occured when inside die_error:\n$escaped_msg");

        # A handler installed through CGI::Carp::set_message runs _after_ the
        # HTTP headers have been written, so die_error is told not to emit
        # them again, and that it is running as the error handler (you
        # cannot jump out of it in that case).
        die_error(undef, undef, $escaped_msg,
                  -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1148
# dispatch: pick the action if none was requested, check that it can be
# served, and call its handler from %actions
sub dispatch {
        unless (defined $action) {
                # no explicit action: derive it from what was asked for
                if (defined $hash) {
                        $action = git_get_type($hash)
                                or die_error(404, "Object does not exist");
                } elsif (defined $hash_base && defined $file_name) {
                        $action = git_get_type("$hash_base:$file_name")
                                or die_error(404, "File or directory does not exist");
                } else {
                        $action = defined $project ? 'summary' : 'project_list';
                }
        }

        die_error(400, "Unknown action")
                unless defined($actions{$action});

        # every action but these three works on a project
        my %projectless = map { $_ => 1 } qw(opml project_list project_index);
        die_error(400, "Project needed")
                if !$projectless{$action} && !$project;

        $actions{$action}->();
}
1173
# Restart the per-request statistics: take a fresh start time (only when
# timing is in use, i.e. $t0 is defined) and zero the git command counter.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [ gettimeofday() ];
        }
        $number_of_git_cmds = 0;
}
1179
our $first_request = 1;
# Serve a single request.  The configuration file and the git version are
# evaluated on the first request only, unless $per_request_config asks for
# more: a code reference is called on every request, any other true value
# makes the configuration be re-read on every request after the first.
sub run_request {
        reset_timer();

        evaluate_uri();
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }
        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list ||= $projectroot;

        # collect, validate and act on the request parameters, in this order
        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1210
# Defaults for plain CGI operation: a single request is served, no hooks
# are installed, and requests are read with the CGI class.
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;
# Switch to FastCGI operation: requests are read with CGI::Fast, and
# $is_last_request is replaced with a counter that reports true once the
# process has served its share of requests.
sub configure_as_fcgi {
        require CGI::Fast;
        our $CGI = 'CGI::Fast';

        my $request_number = 0;
        # let each child service 100 requests; the check runs after a
        # request has been served, so the 100th one has to be the last
        our $is_last_request = sub { ++$request_number >= 100 };
}
# Decide how to run from the script name and the command line:
# - a script name ending in ".fcgi" selects FastCGI mode
# - --fastcgi (--fcgi, -f) does the same
# - --nproc=N (-n N) installs FCGI::ProcManager hooks for N processes;
#   the option is silently ignored when that module cannot be loaded
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        @ARGV or return;

        my $use_proc_manager = sub {
                my ($option, $n_processes) = @_;
                eval { require FCGI::ProcManager; 1; }
                        or return;
                my $manager = FCGI::ProcManager->new({
                        n_processes => $n_processes,
                });
                our $pre_listen_hook    = sub { $manager->pm_manage()        };
                our $pre_dispatch_hook  = sub { $manager->pm_pre_dispatch()  };
                our $post_dispatch_hook = sub { $manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1245
# Main loop: set up the run mode, then serve requests for as long as the
# request class hands out request objects and $is_last_request does not
# say stop.  The optional hooks are called before listening and around
# every request.  Returns 1.
sub run {
        evaluate_argv();

        $first_request = 1;
        if ($pre_listen_hook) {
                $pre_listen_hook->();
        }

 REQUEST:
        while ($cgi = $CGI->new()) {
                if ($pre_dispatch_hook) {
                        $pre_dispatch_hook->();
                }

                run_request();

                if ($post_dispatch_hook) {
                        $post_dispatch_hook->();
                }
                $first_request = 0;

                if ($is_last_request->()) {
                        last REQUEST;
                }
        }

        # NOTE(review): this label is not used inside run() itself;
        # presumably it is a jump target for code elsewhere in the file, so
        # it must stay -- confirm before touching it.
 DONE_GITWEB:
        1;
}
1270
run();

# When wrapped in a subroutine processing requests (e.g. mod_perl with
# ModPerl::Registry, or PSGI with Plack::App::WrapCGI) hand control back
# to the wrapper; as a pure CGI script serving a single request, exit.
return if defined caller;
exit;
1281
1282 ## ======================================================================
1283 ## action links
1284
# Build a link to gitweb itself from named parameters (the long names of
# @cgi_param_mapping, e.g. action => 'blob', hash_base => 'master').
# The project defaults to the current one.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
#
# Returns the URL as a string.
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # take over every parameter of the current request that
                # the caller did not mention
                while (my ($name, $symbol) = each %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot
                # (links without an action are legitimate, hence the guard)
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                # a name containing ".." stays a query
                                                # parameter: ".." separates parent and
                                                # current part in PATH_INFO
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly; walking the array (not the
        # hash) keeps them in declaration order
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1414
1415
1416 ## ======================================================================
1417 ## validation, quoting/unquoting and escaping
1418
# Returns the action name when it is a key of %actions, undef otherwise
# (also for a missing or false name).
sub validate_action {
        my ($input) = @_;
        return undef unless $input;
        return exists $actions{$input} ? $input : undef;
}
1424
# Returns the project name when it may be served, undef otherwise.
# A project is accepted when its name is a valid pathname, it is a
# directory below $projectroot, check_export_ok() agrees and, with
# $strict_export set, it is also part of the project list.
sub validate_project {
        my ($input) = @_;
        return undef unless $input;

        my $path = "$projectroot/$input";
        return undef unless validate_pathname($input);
        return undef unless -d $path;
        return undef unless check_export_ok($path);
        return undef if $strict_export && !project_in_list($input);

        return $input;
}
1436
# Returns the pathname when it is acceptable, undef otherwise.
# Note that a missing or false value (e.g. "" or "0") is rejected too.
sub validate_pathname {
        my ($input) = @_;
        return undef unless $input;

        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
        # at the beginning, at the end, and between slashes.
        # also this catches doubled slashes
        return undef if $input =~ m!(^|/)(|\.|\.\.)(/|$)!;

        # no null characters
        return undef if $input =~ m!\0!;

        return $input;
}
1452
# Returns the ref name when it is acceptable, undef otherwise.
# A string of 40 hex digits is always accepted; anything else has to be a
# valid pathname that also respects the ref name restrictions below.
sub validate_refname {
        my ($input) = @_;
        return undef unless $input;

        # textual hashes are O.K.
        return $input if $input =~ m/^[0-9a-fA-F]{40}$/;

        # it must be correct pathname
        $input = validate_pathname($input)
                or return undef;

        # restrictions on ref name according to git-check-ref-format
        return undef if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

        return $input;
}
1469
# Decode a sequence of octets into Perl's internal character form.
# The input is returned as-is when it already carries the utf8 flag or
# when it decodes cleanly as UTF-8; otherwise it is decoded using
# $fallback_encoding.  Returns undef for an undefined argument.
# gitweb writes its output as UTF-8 thanks to "binmode STDOUT, ':utf8'"
# at the beginning of the script.
sub to_utf8 {
        my ($str) = @_;

        return undef unless defined $str;

        return $str if utf8::is_utf8($str);
        # utf8::decode() converts $str in place and reports success
        return $str if utf8::decode($str);

        return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1483
# URI-escape a query parameter value.  The slash is deliberately left
# alone even though that is not strictly correct: quoted slashes look
# too horrible in bookmarks.  Spaces are written as '+'.
# Returns undef for an undefined argument.
sub esc_param {
        my ($value) = @_;

        return undef unless defined $value;

        $value =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $value =~ tr/ /+/;
        return $value;
}
1493
# URI-escape a path_info fragment.  The rules differ slightly from
# those for query parameters: path_info does not treat '+' as a space,
# so both are left alone, while '?' must be escaped.
# Returns undef for an undefined argument.
sub esc_path_info {
        my ($path) = @_;

        return undef unless defined $path;

        $path =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;
        return $path;
}
1504
# URI-escape unsafe characters in a complete URL.  Characters with a
# structural meaning in a URL (such as '?', '&', '=' and ';') cannot be
# quoted here.  Spaces are written as '+'.
# Returns undef for an undefined argument.
sub esc_url {
        my ($url) = @_;

        return undef unless defined $url;

        $url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $url =~ tr/ /+/;
        return $url;
}
1513
# Quote unsafe characters in HTML attribute values.
sub esc_attr {
        my @args = @_;

        # for XHTML conformance escaping '"' to '&quot;' is not enough,
        # so attribute values are escaped exactly like element content
        return esc_html(@args);
}
1520
# Escape a string for inclusion in HTML.
# The string is converted with to_utf8(), HTML-escaped, and every control
# character except TAB is replaced by its quot_cec() representation.
# Option -nbsp => 1 additionally turns each space into '&nbsp;'.
# Returns undef for an undefined string.
sub esc_html {
        my ($str, %opts) = @_;

        return undef unless defined $str;

        $str = to_utf8($str);
        $str = $cgi->escapeHTML($str);
        $str =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
        return $str;
}
1536
# Escape a filename for inclusion in HTML.
# The name is converted with to_utf8(), HTML-escaped, and every control
# character (TAB included) is replaced by its quot_cec() representation.
# Option -nbsp => 1 additionally turns each space into '&nbsp;'.
# Returns undef for an undefined name.
sub esc_path {
        my ($path, %opts) = @_;

        return undef unless defined $path;

        $path = to_utf8($path);
        $path = $cgi->escapeHTML($path);
        $path =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $path =~ s|([[:cntrl:]])|quot_cec($1)|eg;
        return $path;
}
1552
# Sanitize for use in XHTML + application/xhtml+xml (valid XML 1.0).
# The string is converted with to_utf8(); TAB, LF and CR are kept, and
# every other control character is replaced by its quot_cec()
# representation.  Returns undef for an undefined argument.
sub sanitize {
        my $str = shift;

        return undef unless defined $str;

        $str = to_utf8($str);
        # index() is used on purpose instead of a nested regexp match: a
        # successful match inside the replacement expression would reset
        # $1, and the whitespace character would be lost instead of kept
        $str =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
        return $str;
}
1563
# Make control characters "printable", using character escape codes (CEC).
# A character with a well-known escape sequence is shown as that sequence
# (e.g. '\n'); any other character is shown as a backslash followed by
# its two-digit, zero-padded hexadecimal code.
# By default the result is wrapped in <span class="cntrl">...</span>;
# option -nohtml => 1 returns the bare escape text instead.
sub quot_cec {
        my ($cntrl, %opts) = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );
        # %02x rather than %2x: codes below 0x10 must be padded with a
        # zero, not with a space
        my $chr = exists $es{$cntrl}
                ? $es{$cntrl}
                : sprintf('\%02x', ord($cntrl));

        return $chr if $opts{-nohtml};
        return "<span class=\"cntrl\">$chr</span>";
}
1588
# Alternatively use Unicode control pictures codepoints,
# Unicode "printable representation" (PR).
# Returns a decimal numeric character reference for the picture of the
# given control character, wrapped in <span class="cntrl">...</span>
# unless option -nohtml => 1 is given.
sub quot_upr {
        my ($cntrl, %opts) = @_;

        my $code = ord($cntrl);
        # the pictures for 0x00..0x20 sit at U+2400 + code, but the one
        # for DEL (0x7f) is U+2421 rather than U+2400 + 0x7f
        my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

        my $chr = sprintf('&#%04d;', $picture);
        return $chr if $opts{-nohtml};
        return "<span class=\"cntrl\">$chr</span>";
}
1602
# git may return quoted and escaped filenames.
# A name enclosed in double quotes has the quotes removed and its
# backslash sequences expanded; any other name is returned unchanged.
sub unquote {
        my ($str) = @_;

        # expand what follows a single backslash
        sub unq {
                my ($seq) = @_;
                my %es = ( # character escape codes, aka escape sequences
                        't' => "\t",   # tab            (HT, TAB)
                        'n' => "\n",   # newline        (NL)
                        'r' => "\r",   # return         (CR)
                        'f' => "\f",   # form feed      (FF)
                        'b' => "\b",   # backspace      (BS)
                        'a' => "\a",   # alarm (bell)   (BEL)
                        'e' => "\e",   # escape         (ESC)
                        'v' => "\013", # vertical tab   (VT)
                );

                # octal char sequence
                return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

                # C escape sequence (aka character escape code), or else a
                # quoted ordinary character that stands for itself
                return exists $es{$seq} ? $es{$seq} : $seq;
        }

        # nothing to do unless the whole name is wrapped in double quotes
        return $str unless $str =~ m/^"(.*)"$/;

        $str = $1;
        $str =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $str;
}
1638
# Escape tabs (convert tabs to spaces).
# Each tab is replaced by as many spaces as it takes to reach the next
# column that is a multiple of 8.
sub untabify {
        my ($line) = @_;

        my $pos;
        while (($pos = index($line, "\t")) != -1) {
                # distance to the next tab stop, always between 1 and 8
                my $width = 8 - ($pos % 8);
                substr($line, $pos, 1, ' ' x $width);
        }

        return $line;
}
1652
# Count the entries returned by git_get_projects_list() whose 'path'
# equals $project.  Returns 0 when that list is empty.
sub project_in_list {
        my ($project) = @_;

        my @known = git_get_projects_list();
        return 0 unless @known;

        my $hits = grep { $_->{'path'} eq $project } @known;
        return $hits;
}
1658
1659 ## ----------------------------------------------------------------------
1660 ## HTML aware string manipulation
1661
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Arguments: string, $len, $add_len (defaults to 10) and the place to
# chop at: 'left', 'center' or 'right' (the default).
sub chop_str {
        my ($str, $len, $add_len, $where) = @_;
        $add_len ||= 10;
        $where   ||= 'right'; # 'left' | 'center' | 'right'

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # return early if chopping wouldn't make the string shorter;
        # the filler is 5 characters long when chopping in the middle
        # and 4 characters long otherwise
        my $centered   = ($where eq 'center');
        my $filler_len = $centered ? 5 : 4;
        return $str if $len + $filler_len >= length($str);

        # when chopping in the middle, distribute $len into left and
        # right part
        $len = int($len/2) if $centered;

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        if ($where eq 'left') {
                $str =~ m/^(.*?)($begre)$/;
                my ($dropped, $kept) = ($1, $2);
                $dropped = " ..." if length($dropped) > 4;
                return $dropped . $kept;
        }

        if ($centered) {
                $str =~ m/^($endre)(.*)$/;
                my ($head, $rest) = ($1, $2);
                $rest =~ m/^(.*?)($begre)$/;
                my ($gap, $end) = ($1, $2);
                $gap = " ... " if length($gap) > 5;
                return $head . $gap . $end;
        }

        $str =~ m/^($endre)(.*)$/;
        my ($kept, $dropped) = ($1, $2);
        $dropped = "... " if length($dropped) > 4;
        return $kept . $dropped;
}
1721
# Takes the same arguments as chop_str, and returns the HTML-escaped
# result.  If the string did get chopped, the result is also wrapped in
# a <span> whose title attribute holds the full string, with control
# characters replaced by '?'.
sub chop_and_escape_str {
        my $short = chop_str(@_);
        my $full  = to_utf8($_[0]);

        return esc_html($short) if $short eq $full;

        $full =~ s/[[:cntrl:]]/?/g;
        return $cgi->span({-title=>$full}, esc_html($short));
}
1737
# Highlight selected fragments of string, using given CSS class,
# and escape HTML.  It is assumed that fragments do not overlap.
# Regions are passed as list of pairs (array references); every other
# trailing argument is handed to esc_html() as an option.
#
# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
# '<span class="mark">foo</span>bar'
sub esc_html_hl_regions {
        my ($str, $css_class, @rest) = @_;

        # separate the [begin, end] pairs from the esc_html() options
        my (@regions, @opt_list);
        for my $arg (@rest) {
                if (ref($arg) eq 'ARRAY') {
                        push @regions, $arg;
                } else {
                        push @opt_list, $arg;
                }
        }
        my %opts = @opt_list;

        return esc_html($str, %opts) unless @regions;

        my $out = '';
        my $pos = 0;

        for my $region (@regions) {
                my ($begin, $end) = @$region;

                # Don't create empty <span> elements.
                next if $end <= $begin;

                my $marked = esc_html(substr($str, $begin, $end - $begin),
                                      %opts);

                # plain text between the previous region and this one
                if ($begin - $pos > 0) {
                        $out .= esc_html(substr($str, $pos, $begin - $pos), %opts);
                }
                $out .= $cgi->span({-class => $css_class}, $marked);

                $pos = $end;
        }

        # plain text after the last region
        if ($pos < length($str)) {
                $out .= esc_html(substr($str, $pos), %opts);
        }

        return $out;
}
1773
# Return positions of beginning and end of each match of $regexp in
# $str, as a list of [ begin, end ] pairs (end is the offset just past
# the match).  Returns nothing when either argument is undefined.
sub matchpos_list {
        my ($str, $regexp) = @_;
        return unless (defined $str && defined $regexp);

        my @matches;
        # The (?:...) wrapper keeps the pattern from ever being empty: an
        # empty pattern would make perl silently reuse the last
        # successfully matched regexp instead of $regexp.
        while ($str =~ /(?:$regexp)/g) {
                push @matches, [$-[0], $+[0]];
        }
        return @matches;
}
1785
# Highlight match (if any), and escape HTML.
# Every match of $regexp in $str is wrapped in a span of class 'match';
# without a regexp, or without any match, $str is merely escaped.
sub esc_html_match_hl {
        my ($str, $regexp) = @_;

        if (defined $regexp) {
                my @matches = matchpos_list($str, $regexp);
                return esc_html_hl_regions($str, 'match', @matches)
                        if @matches;
        }

        return esc_html($str);
}
1796
1797
# Highlight match (if any) of shortened string, and escape HTML.
# Matches are searched for in the full $str, but it is $chopped that
# gets displayed: matches falling inside the kept part are marked as
# they are, and the first match reaching beyond it is shown by marking
# the "... " tail.
sub esc_html_match_hl_chopped {
        my ($str, $chopped, $regexp) = @_;
        return esc_html_match_hl($str, $regexp) unless defined $chopped;

        my @matches = matchpos_list($str, $regexp);
        return esc_html($chopped) unless @matches;

        # filter matches so that we mark chopped string;
        # split off the tail (if any) that chop_str appends
        my $ellipsis = "... "; # see chop_str
        my $tail = ($chopped =~ s/\Q$ellipsis\E$//) ? $ellipsis : '';

        my $chop_len = length($chopped);
        my $tail_len = length($tail);
        my $full_len = $chop_len + $tail_len;
        my @kept;

        for my $m (@matches) {
                my ($from, $to) = @$m;

                if ($from > $chop_len) {
                        # match lies in the chopped-off part: mark the tail
                        push @kept, [ $chop_len, $full_len ] if ($tail_len > 0);
                        last;
                }
                if ($to > $chop_len) {
                        # match straddles the cut: extend it over the tail
                        push @kept, [ $from, $full_len ];
                        last;
                }
                push @kept, $m;
        }

        return esc_html_hl_regions($chopped . $tail, 'match', @kept);
}
1828
1829 ## ----------------------------------------------------------------------
1830 ## functions returning short strings
1831
# CSS class for given age value (in seconds):
# "noage" for an undefined age, "age0" below two hours, "age1" below
# two days, and "age2" for anything older.
sub age_class {
        my ($age) = @_;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1846
# Convert age in seconds to "nn units ago" string.
# The largest unit of which the age spans more than two is used, with
# the count truncated to an integer; an age of two seconds or less
# yields " right now" (with its leading space).
sub age_string {
        my ($age) = @_;

        return int($age/60/60/24/365) . " years ago"
                if $age > 60*60*24*365*2;
        return int($age/60/60/24/(365/12)) . " months ago"
                if $age > 60*60*24*(365/12)*2;
        return int($age/60/60/24/7) . " weeks ago"
                if $age > 60*60*24*7*2;
        return int($age/60/60/24) . " days ago"
                if $age > 60*60*24*2;
        return int($age/60/60) . " hours ago"
                if $age > 60*60*2;
        return int($age/60) . " min ago"
                if $age > 60*2;
        return int($age) . " sec ago"
                if $age > 2;

        return " right now";
}
1878
# File type bits that Fcntl's ':mode' set does not provide.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# Test for a submodule/subproject, i.e. a commit object reference:
# true when the file type bits of $mode equal S_IFGITLINK.
sub S_ISGITLINK {
        my ($mode) = @_;

        my $type_bits = $mode & S_IFMT();
        return ($type_bits == S_IFGITLINK);
}
1890
# Convert file mode in octal to symbolic file mode string.
# Only the file type and, for regular files, the owner's executable bit
# influence the result; a type that is not recognized gives '----------'.
sub mode_str {
        my $mode = oct shift;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
        return 'lrwxrwxrwx' if S_ISLNK($mode);
        return '----------' unless S_ISREG($mode);

        # git cares only about the executable bit
        return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1912
# Convert file mode in octal to file type string: "submodule",
# "directory", "symlink", "file" or "unknown".
# An argument that is not a string of octal digits is returned as is.
sub file_type {
        my ($mode) = @_;

        return $mode if $mode !~ m/^[0-7]+$/;
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT);
        return "symlink"   if S_ISLNK($mode);
        return "file"      if S_ISREG($mode);
        return "unknown";
}
1935
# Convert file mode in octal to file type description string:
# "submodule", "directory", "symlink", "executable" (a regular file
# with the owner's executable bit set), "file" or "unknown".
# An argument that is not a string of octal digits is returned as is.
sub file_type_long {
        my ($mode) = @_;

        return $mode if $mode !~ m/^[0-7]+$/;
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT);
        return "symlink"   if S_ISLNK($mode);
        return "unknown"   unless S_ISREG($mode);

        return ($mode & S_IXUSR) ? "executable" : "file";
}
1962
1963
1964 ## ----------------------------------------------------------------------
1965 ## functions returning short HTML fragments, or transforming HTML fragments
1966 ## which don't belong to other sections
1967
# Format line of commit message: escape it for HTML (spaces become
# '&nbsp;') and turn every run of 8 to 40 hexadecimal digits standing
# on word boundaries into a link to the "object" action for that id.
sub format_log_line_html {
        my ($line) = @_;

        $line = esc_html($line, -nbsp=>1);
        $line =~ s{\b([0-9a-fA-F]{8,40})\b}{
                my $id = $1;
                $cgi->a({-href  => href(action=>"object", hash=>$id),
                         -class => "text"}, $id);
        }eg;

        return $line;
}
1980
# format marker of refs pointing to given object
#
# $refs maps object ids to array references of ref names such as
# "tags/v2.6.11" or "heads/next"; a trailing "^{}" marks an indirect
# (dereferenced annotated tag) entry.  Returns an HTML fragment holding
# one marker per ref of $id, or the empty string when there is none.
# NOTE: the "^{}" suffix is stripped from the entries of $refs in place.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $ref (@{$refs->{$id}}) {
                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my ($type, $name) = qw();
                        my $indirect = ($ref =~ s/\^\{\}$//);
                        # e.g. tags/v2.6.11 or heads/next
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                $type = $1;
                                $name = $2;
                        } else {
                                $type = "ref";
                                $name = $ref;
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        # the link text is element content, so it has to be
                        # escaped here: ref names may contain '<', '>' and '&'
                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, esc_html($name));

                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
2040
# Format the title line as a link to $href, followed by $extra (e.g.
# ref markers).  When $short is shorter than $long, the link shows
# $short and carries $long, with control characters replaced by '?',
# as its title attribute; otherwise the link simply shows $long.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my %attr = (-href => $href, -class => "list subject");
        my $text = $long;

        if (length($short) < length($long)) {
                $long =~ s/[[:cntrl:]]/?/g;
                $attr{-title} = to_utf8($long);
                $text = $short;
        }

        return $cgi->a(\%attr, esc_html($text)) . $extra;
}
2056
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines (currently gravatar only), which
# are free to use it as preferred. Since only one avatar engine is used for any
# given page, there's no risk for cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first and the resulting URL is kept in
# %avatar_cache under the lowercased address.
sub picon_url {
        my $email = lc shift;
        if (!$avatar_cache{$email}) {
                my ($user, $domain) = split('@', $email);
                # an address without '@' has no domain, and an empty address
                # has no user either; use empty strings so that no undefined
                # value gets interpolated into the URL
                $user   = '' unless defined $user;
                $domain = '' unless defined $domain;
                $avatar_cache{$email} =
                        "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                        "$domain/$user/" .
                        "users+domains+unknown/up/single";
        }
        return $avatar_cache{$email};
}
2078
# Compute the gravatar url for a given email, if it's not in the cache already.
# Gravatar stores only the part of the URL before the size, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
# The email is lowercased before it is hashed and used as the cache key.
sub gravatar_url {
        my ($email, $size) = @_;
        $email = lc $email;

        unless ($avatar_cache{$email}) {
                $avatar_cache{$email} =
                        "http://www.gravatar.com/avatar/" .
                        Digest::MD5::md5_hex($email) . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
2091
# Insert an avatar for the given $email at the given $size if the feature
# is enabled.
# Options: -size names an entry of %avatar_size (falling back to
# 'default'); -pad_before / -pad_after add a '&nbsp;' before / after
# the image.  Returns an <img> element, or "" when no avatar url is
# available.
sub git_get_avatar {
        my ($email, %opts) = @_;

        my $size_name = $opts{-size} || 'default';
        my $size = $avatar_size{$size_name} || $avatar_size{'default'};

        # Other providers can be added by extending the chain below. If no
        # variant puts something in $url, we assume avatars are completely
        # disabled/unavailable.
        my $url = $git_avatar eq 'gravatar' ? gravatar_url($email, $size)
                : $git_avatar eq 'picon'    ? picon_url($email)
                :                             "";
        return "" unless $url;

        my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
        my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";

        return $pre_white .
               "<img width=\"$size\" " .
                    "class=\"avatar\" " .
                    "src=\"" . esc_url($url) . "\" " .
                    "alt=\"\" " .
               "/>" . $post_white;
}
2120
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype ('author' or 'committer') selects the kind of search and
# the wording of the link title.  When the 'search' feature is turned
# off, $displaytext is returned unchanged.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        return $displaytext unless gitweb_check_feature('search');

        my $performed = "";
        $performed = "authored"  if $searchtype eq 'author';
        $performed = "committed" if $searchtype eq 'committer';

        return $cgi->a({
                        -href => href(action=>"search", hash=>$hash,
                                      searchtext=>$author,
                                      searchtype=>$searchtype),
                        class => "list",
                        title => "Search for commits $performed by $author",
                }, $displaytext);
}
2143
# Format the author name of the given commit with the given tag.
# The author name is chopped and escaped according to the other
# optional parameters (see chop_str), preceded by the author's avatar
# and wrapped in an author search link.
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $author = chop_and_escape_str($co->{'author_name'}, @chop_args);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
        my $link   = format_search_author($co->{'author_name'}, "author",
                                          $avatar . $author);

        return "<$tag class=\"author\">" . $link . "</$tag>";
}
2157
# Format git diff header line, i.e. "diff --(git|combined|cc) ...".
# The pathnames found in $line are dropped and written anew from $from
# and $to, each one as a link when the corresponding 'href' is set.
# Returns the line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        # wrap $text in a "path" link when $side has an href; a side
        # without href (file added or deleted) gets plain text
        my $path_html = sub {
                my ($side, $text) = @_;
                return $text unless $side->{'href'};
                return $cgi->a({-href => $side->{'href'}, -class => "path"},
                               $text);
        };

        if ($diffinfo->{'nparents'}) {
                # combined diff: a single pathname, without prefix
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $path_html->($to, esc_path($to->{'file'}));
        } else {
                # "ordinary" diff: "a/<from> b/<to>"
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                $line .= $path_html->($from, 'a/' . esc_path($from->{'file'}));
                $line .= ' ';
                $line .= $path_html->($to, 'b/' . esc_path($to->{'file'}));
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2193
# Format extended diff header line, before patch itself.
# - "copy|rename from|to <path>": the path is replaced by a link built
#   from $from / $to (only when the respective 'href' is set)
# - a line ending in a six-digit mode gets the file type description
#   appended
# - "index <hash>..<hash>" and, for combined diffs,
#   "index <hash>,<hash>..<hash>": the hashes are replaced by links
#   showing their first 7 characters, or by 7 zeros where no href exists
# Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
        my $line = shift;
        my $diffinfo = shift;
        my ($from, $to) = @_;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                       esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }
        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }
        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                $line = 'index ';
                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
                                                  -class=>"hash"},
                                                 substr($diffinfo->{'from_id'}[$i],0,7));
                        } else {
                                $line .= '0' x 7;
                        }
                        # separator
                        $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
                }
                $line .= '..';
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                         substr($diffinfo->{'to_id'},0,7));
                } else {
                        $line .= '0' x 7;
                }

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff; the dots are escaped so
                # that only a literal ".." separator is accepted
                my ($from_link, $to_link);
                if ($from->{'href'}) {
                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                             substr($diffinfo->{'from_id'},0,7));
                } else {
                        $from_link = '0' x 7;
                }
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                } else {
                        $to_link = '0' x 7;
                }
                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                # \Q...\E: the ids are data, not patterns
                $line =~ s!\Q$from_id\E\.\.\Q$to_id\E!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2259
# Format the from-file/to-file ("--- ..." / "+++ ...") part of a diff header.
#
# $from_line and $to_line are the raw header lines, $diffinfo/$from/$to
# describe the compared files, and @parents supplies the hash_parent_base
# values for the per-parent blobdiff links of a combined diff.
# Returns HTML: one <div class="diff from_file"> per from-file line,
# followed by a single <div class="diff to_file">.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my @divs;

	if ($diffinfo->{'nparents'}) {
		# combined diff (merge commit): one from-file line per parent
		foreach my $n (0 .. $diffinfo->{'nparents'} - 1) {
			my $text = '--- /dev/null';
			if ($from->{'href'}[$n]) {
				# "<n>/<path>": <n> links to the blobdiff against
				# that parent, <path> links to the parent's blob
				$text = '--- ' .
					$cgi->a({-href=>href(action=>"blobdiff",
					                     hash_parent=>$diffinfo->{'from_id'}[$n],
					                     hash_parent_base=>$parents[$n],
					                     file_parent=>$from->{'file'}[$n],
					                     hash=>$diffinfo->{'to_id'},
					                     hash_base=>$hash,
					                     file_name=>$to->{'file'}),
					         -class=>"path",
					         -title=>"diff" . ($n+1)},
					        $n+1) .
					'/' .
					$cgi->a({-href=>$from->{'href'}[$n], -class=>"path"},
					        esc_path($from->{'file'}[$n]));
			}
			push @divs, qq!<div class="diff from_file">$text</div>\n!;
		}

	} else {
		# ordinary (single parent) diff;
		# a "--- /dev/null" line is passed through untouched
		my $text = $from_line;
		if ($text =~ m!^--- "?a/!) {
			if ($from->{'href'}) {
				$text = '--- a/' .
					$cgi->a({-href=>$from->{'href'}, -class=>"path"},
					        esc_path($from->{'file'}));
			} else {
				$text = '--- a/' . esc_path($from->{'file'});
			}
		}
		push @divs, qq!<div class="diff from_file">$text</div>\n!;
	}

	# to-file line; "+++ /dev/null" gets no extra formatting either
	my $to_text = $to_line;
	if ($to_text =~ m!^\+\+\+ "?b/!) {
		if ($to->{'href'}) {
			$to_text = '+++ b/' .
				$cgi->a({-href=>$to->{'href'}, -class=>"path"},
				        esc_path($to->{'file'}));
		} else {
			$to_text = '+++ b/' . esc_path($to->{'file'});
		}
	}
	push @divs, qq!<div class="diff to_file">$to_text</div>\n!;

	return join('', @divs);
}
2325
# Build the note shown for a patch that the combined diff simplified away:
# a "diff --cc <file>" header (the file name is linked to its blob unless
# the file was deleted) followed by a "Simple merge" marker.
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $file;
	if (is_deleted($diffinfo)) {
		# nothing to link to
		$file = esc_path($diffinfo->{'to_file'});
	} else {
		$file = $cgi->a({-href => href(action=>"blob",
		                               hash_base=>$hash,
		                               hash=>$diffinfo->{'to_id'},
		                               file_name=>$diffinfo->{'to_file'}),
		                 -class => "path"},
		                esc_path($diffinfo->{'to_file'}));
	}

	return "<div class=\"diff header\">" . "diff --cc " . $file . "</div>\n" .
	       "<div class=\"diff nodifferences\">" . "Simple merge" . "</div>\n";
}
2350
# Classify a patch line, returning the CSS class name for it:
# "chunk_header", "incomplete", "ctx", "add", "rem", or "" if nothing fits.
# For a combined diff ($from->{'href'} is an array reference) the number of
# leading sign columns equals the number of entries in that array.
sub diff_line_class {
	my ($line, $from, $to) = @_;

	# one sign column for ordinary diff, one per parent for combined diff
	my $num_sign = ($from && $to && ref($from->{'href'}) eq "ARRAY")
		? scalar @{$from->{'href'}}
		: 1;

	return "chunk_header" if $line =~ m/^\@\@{$num_sign} /;
	return "incomplete"   if $line =~ m/^\\/;
	# context has to be tested before add/rem, because the add/rem
	# patterns below also accept lines made of spaces only
	return "ctx"          if $line =~ m/^ {$num_sign}/;
	return "add"          if $line =~ m/^[+ ]{$num_sign}/;
	return "rem"          if $line =~ m/^[- ]{$num_sign}/;

	# fallback
	return "";
}
2379
# Format a chunk header ("@@ -a,b +c,d @@ section") of a unified diff.
# Expects $from and $to to be defined and filled in, and $line to be such
# a chunk header.  Each range is linked to its starting line ("#l<n>") in
# the corresponding file when an href for that side is available.
sub format_unidiff_chunk_header {
	my ($line, $from, $to) = @_;

	# the line counts are captured by the pattern but not needed here
	my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
		$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

	$from_text = $cgi->a({-href=>$from->{'href'} . "#l$from_start",
	                      -class=>"list"}, $from_text)
		if $from->{'href'};
	$to_text = $cgi->a({-href=>$to->{'href'} . "#l$to_start",
	                    -class=>"list"}, $to_text)
		if $to->{'href'};

	return '<span class="chunk_info">@@ ' . $from_text . ' ' . $to_text . ' @@</span>' .
	       '<span class="section">' . esc_html($section, -nbsp=>1) . '</span>';
}
2403
# Format a chunk header ("@@@ -a,b -c,d +e,f @@@ section") of a combined
# diff.  Expects $from and $to to be defined and filled in, and $line to be
# such a chunk header.  Every range is linked to its starting line in the
# matching file when an href for it is available; the last range is the
# to-file one.
sub format_cc_diff_chunk_header {
	my ($line, $from, $to) = @_;

	my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

	# "-12,3" / "+12,3" / "-12": drop the sign, keep the starting line
	my @range_text  = split(' ', $ranges);
	my @range_start = map { (split(',', substr($_, 1)), 0)[0] } @range_text;

	my $to_text  = pop @range_text;
	my $to_start = pop @range_start;

	my $html = "<span class=\"chunk_info\">$prefix ";
	foreach my $i (0 .. $#range_text) {
		my $text = $range_text[$i];
		if ($from->{'href'}[$i]) {
			$text = $cgi->a({-href=>$from->{'href'}[$i] . "#l$range_start[$i]",
			                 -class=>"list"}, $text);
		}
		$html .= $text . " ";
	}

	if ($to->{'href'}) {
		$to_text = $cgi->a({-href=>$to->{'href'} . "#l$to_start",
		                    -class=>"list"}, $to_text);
	}
	$html .= $to_text;

	$html .= " $prefix</span>" .
	         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
	return $html;
}
2442
# Turn one patch (diff) line into an HTML <div>; not meant for diff headers.
# A line passed by reference is taken to be ready-made HTML and is used
# verbatim; a plain string is chomped, untabified and then either formatted
# as a chunk header (when $from and $to are given) or HTML-escaped.
# $diff_class, if true, is appended to the "diff" CSS class.
sub format_diff_line {
	my ($line, $diff_class, $from, $to) = @_;

	my $html;
	if (ref($line)) {
		$html = ${$line};
	} else {
		chomp $line;
		my $text = untabify($line);
		my $have_files = $from && $to;

		if ($have_files && $text =~ m/^\@{2} /) {
			$html = format_unidiff_chunk_header($text, $from, $to);
		} elsif ($have_files && $text =~ m/^\@{3}/) {
			$html = format_cc_diff_chunk_header($text, $from, $to);
		} else {
			$html = esc_html($text, -nbsp=>1);
		}
	}

	my $classes = $diff_class ? "diff $diff_class" : "diff";
	return "<div class=\"$classes\">$html</div>\n";
}
2471
# Produce the snapshot link(s) for the tree/commit given by $hash:
#  - no snapshot format configured: undef
#  - exactly one format:            "_snapshot_" (the format is in the tooltip)
#  - several formats:               "snapshot (_tar.gz_ _zip_)"
sub format_snapshot_links {
	my ($hash) = @_;

	return undef unless @snapshot_fmts;

	if (@snapshot_fmts == 1) {
		# A single "snapshot" link whose tooltip bears the format name.
		my ($fmt) = @snapshot_fmts;
		return
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				),
				-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
			}, "snapshot");
	}

	# A parenthesized list of links bearing format names.
	my @links = map {
		$cgi->a({
			-href => href(
				action=>"snapshot",
				hash=>$hash,
				snapshot_format=>$_
			)
		}, $known_snapshot_formats{$_}{'display'})
	} @snapshot_fmts;

	return "snapshot (" . join(' ', @links) . ")";
}
2506
2507 ## ......................................................................
2508 ## functions returning values to be passed, perhaps after some
2509 ## transformation, to other functions; e.g. returning arguments to href()
2510
# Return a hash of parameters to hand to href() in order to build the feed
# URL for the current view; its -title key holds a description of the link.
# $format (default 'Atom') selects the feed action.  Returns nothing when
# no project is selected or when the current action has no feed of its own.
sub get_feed_info {
	my $format = shift || 'Atom';

	# feed links are possible only for project views
	defined $project or return;
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branch refs carry the full 'refs/heads/' prefix to tell them apart
	# from tag links; that also lets us detect branch links here
	my $branch;
	foreach my $ref ($hash_base, $hash) {
		next unless defined $ref;
		if ($ref =~ m!^refs/heads/(.*)$!) {
			$branch = $1;
			last;
		}
	}

	# find log type for feed description (title)
	my $type;
	if (defined $file_name) {
		$type  = "history of $file_name";
		$type .= "/" if ($action eq 'tree');
		$type .= " on '$branch'" if (defined $branch);
	} elsif (defined $branch) {
		$type = "log of $branch";
	} else {
		$type = 'log';
	}

	my %res = (
		action      => lc($format),
		-title      => $type,
		'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
		'file_name' => $file_name,
	);
	return %res;
}
2546
2547 ## ----------------------------------------------------------------------
2548 ## git utility subroutines, invoking git commands
2549
# Return, as a list, the path to the core git executable followed by the
# --git-dir parameter for the current $git_dir.  Every call is counted in
# $number_of_git_cmds.
sub git_cmd {
	++$number_of_git_cmds;
	return ($GIT, "--git-dir=" . $git_dir);
}
2555
# Quote the given arguments so that they can be passed to the shell:
#   quote_command("command", "arg 1", "arg with ' and ! characters")
#   => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Avoid this function wherever a list-form invocation is possible.
sub quote_command {
	my @quoted;
	foreach my $arg (@_) {
		# work on a copy so that the caller's arguments are left alone
		(my $word = $arg) =~ s/(['!])/'\\$1'/g;
		push @quoted, "'$word'";
	}
	return join(' ', @quoted);
}
2564
# Resolve the HEAD ref of the given project to its full hash.
sub git_get_head_hash {
	my ($project) = @_;
	return git_get_full_hash($project, 'HEAD');
}
2569
# Resolve ($project, $hash) to a full object name; all arguments are
# handed to git_get_hash() unchanged.
sub git_get_full_hash {
	my @args = @_;
	return git_get_hash(@args);
}
2573
# Same as git_get_full_hash(), but asks rev-parse for an abbreviated
# object name by appending the '--short=7' option.
sub git_get_short_hash {
	my @args = (@_, '--short=7');
	return git_get_hash(@args);
}
2577
# Run "git rev-parse --verify -q @options $hash" in the repository of
# $project and return the first line of its output (chomped), or undef if
# the command could not be started or printed nothing.
# $git_dir is pointed at the project for the duration of the call and is
# put back afterwards, but only if it had a defined value before.
sub git_get_hash {
	my ($project, $hash, @options) = @_;

	my $saved_git_dir = $git_dir;
	$git_dir = "$projectroot/$project";

	my $resolved;
	my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
	if (open my $fd, '-|', @cmd) {
		$resolved = <$fd>;
		chomp $resolved if defined $resolved;
		close $fd;
	}

	$git_dir = $saved_git_dir if defined $saved_git_dir;
	return $resolved;
}
2594
# Return the type of the object named by $hash, as printed by
# "git cat-file -t".  Returns nothing if the command cannot be started or
# if closing its pipe reports failure.
sub git_get_type {
	my ($hash) = @_;

	my $fd;
	unless (open($fd, "-|", git_cmd(), "cat-file", '-t', $hash)) {
		return;
	}
	my $type = <$fd>;
	unless (close $fd) {
		return;
	}

	chomp $type;
	return $type;
}
2605
# Per-repository configuration cache: %config holds the parsed values and
# $config_file names the config file they were loaded for ('' = none yet).
our %config;
our $config_file = '';
2609
# Add $value under $key in the hash referenced by $hash.
# The first value for a key is stored directly (not as [ <value> ]); from
# the second value on, the entry becomes an anonymous array of all values.
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (exists $hash->{$key}) {
		if (ref $hash->{$key}) {
			# already multi-valued
			push @{$hash->{$key}}, $value;
		} else {
			# second value: promote the scalar to an array
			$hash->{$key} = [ $hash->{$key}, $value ];
		}
	} else {
		$hash->{$key} = $value;
	}
}
2623
# Return a hash of the git configuration of the current project, as listed
# by "git config -z -l".  Keys with several values map to an array reference
# (see hash_set_multi()).
# $section_regexp, if given, limits the result to keys of matching sections,
# e.g. 'gitweb'.  Returns nothing if the git command cannot be started.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# Compile the section filter once per call.  (A match with the /o
	# modifier would instead freeze the pattern of the very first call
	# and silently ignore a different $section_regexp later on.)
	my $section_re = defined $section_regexp
		? qr/^(?:$section_regexp)\./
		: undef;

	# "git config -z" terminates every entry with NUL
	local $/ = "\0";

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		# key and value are separated by the first newline;
		# a key without value has no newline at all
		my ($key, $value) = split(/\n/, $keyval, 2);

		hash_set_multi(\%config, $key, $value)
			if (!defined $section_re || $key =~ $section_re);
	}
	close $fh;

	return %config;
}
2646
# Interpret a config value as a boolean.
# A missing value (bare "section.key"), a number other than 0, 'true' and
# 'yes' (in any letter case) are true; everything else is false and never
# an error.
sub config_to_bool {
	my ($val) = @_;

	# section.key
	defined $val or return 1;

	# strip leading and trailing whitespace
	for ($val) {
		s/^\s+//;
		s/\s+$//;
	}

	return (($val =~ /^\d+$/ && $val) ||   # section.key = 1
	        ($val =~ /^(?:true|yes)$/i));  # section.key = true
}
2662
# Convert a config value to a simple decimal number.
# An optional suffix of 'k', 'm' or 'g' (in any letter case) multiplies the
# value by 1024, 1048576 or 1073741824.  A value without such a suffix is
# returned as is, with surrounding whitespace removed.
# An undefined value (a key that has no value) is passed through as undef
# without touching it, so that it does not trigger "uninitialized" warnings.
sub config_to_int {
	my $val = shift;

	return $val unless defined $val;

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	my %multiplier_for = (
		'k' => 1024,
		'm' => 1048576,
		'g' => 1073741824,
	);
	if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
		return $num * $multiplier_for{lc($unit)};
	}
	return $val;
}
2682
# Make sure a config value is an array reference: a reference is returned
# unchanged, a defined scalar is wrapped in a one-element array, and an
# undefined value yields an empty array.
sub config_to_multi {
	my ($val) = @_;

	return $val if ref($val);
	return defined($val) ? [ $val ] : [];
}
2689
# Look up the "gitweb.$key" variable in the configuration of the current
# repository ($git_dir).  $key may be given with or without the "gitweb."
# prefix.  $type may be 'bool' or 'int' (optionally written '--bool' /
# '--int'); any other type is ignored.
# Returns nothing if $git_dir is unset, the key is empty or malformed, or
# the variable does not exist.  Otherwise returns the raw value, the string
# 'true'/'false' for 'bool', or the converted number for 'int'.
# The parsed configuration is cached in %config, keyed on $config_file.
sub git_get_project_config {
	my ($key, $type) = @_;

	defined $git_dir or return;

	# key sanity check
	$key or return;
	# only subsection, if exists, is case sensitive,
	# and not lowercased by 'git config -z -l'
	if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
		$key = lc($1) . ".$2." . lc($3);
	} else {
		$key = lc($key);
	}
	$key =~ s/^gitweb\.//;
	return if ($key =~ m/\W/);

	# type sanity check
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			if ($type ne 'bool' && $type ne 'int');
	}

	# (re)load the config when it was read for another repository
	my $wanted_file = "$git_dir/config";
	unless (defined $config_file && $config_file eq $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	my $full_key = "gitweb.$key";
	return unless exists $config{$full_key};
	my $value = $config{$full_key};

	# ensure given type
	if (defined $type) {
		# backward compatibility: 'git config --bool' returns true/false
		return (config_to_bool($value) ? 'true' : 'false')
			if ($type eq 'bool');
		return config_to_int($value)
			if ($type eq 'int');
	}
	return $value;
}
2735
# Get the hash of the entry at $path in the tree-ish $base, using
# "git ls-tree".  If $type is given, the entry must be of that type
# (e.g. 'blob' or 'tree').
# Returns undef if $path is empty, if there is no such entry, if the
# ls-tree output cannot be parsed, or if the type does not match.
# (Failures are reported with an explicit undef, as callers may use the
# result inside argument lists.)
sub git_get_hash_by_path {
	my $base = shift;
	my $path = shift || return undef;
	my $type = shift;

	# a trailing slash would make ls-tree list the directory contents
	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
	# Take the captures from this very match only; without the check a
	# failed match would leave stale $2/$3 of some earlier match in use.
	my ($entry_type, $entry_hash) =
		$line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/
		or return undef;

	if (defined $type && $type ne $entry_type) {
		# type doesn't match
		return undef;
	}
	return $entry_hash;
}
2762
# Get the path of the entry with the given $hash in the tree-ish $base.
# Used to find the 'from' filename for combined diff (merge commit) in the
# presence of renames.
# Returns the path of the first matching entry listed by
# "git ls-tree -r -t -z", nothing if $base or $hash is empty, and undef if
# the command cannot be started or no entry matches.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	# "ls-tree -z" terminates every entry with NUL
	local $/ = "\0";

	#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423	gitweb'
	#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f	gitweb/README'
	# $hash is matched literally (\Q..\E) and the whole entry is anchored;
	# /s with \z lets the path part contain newlines, which -z permits.
	my $entry_re = qr/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s;

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;
	while (my $line = <$fd>) {
		chomp $line;

		if ($line =~ $entry_re) {
			my $path = $1;
			close $fd;
			return $path;
		}
	}
	close $fd;
	return undef;
}
2786
2787 ## ......................................................................
2788 ## git utility functions, directly accessing git repository
2789
# Get the value of a setting either from the file named like the setting
# inside the repository ($GIT_DIR/$name; only its first line is used), or,
# if that file cannot be opened, from the gitweb.$name variable of the
# repository config.  Sets $git_dir to the repository at $path.
sub git_get_file_or_project_config {
	my ($path, $name) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open($fd, '<', "$git_dir/$name")) {
		return git_get_project_config($name);
	}
	my $conf = <$fd>;
	close $fd;

	chomp $conf if defined $conf;
	return $conf;
}
2806
# Description of the project at the given path: taken from its
# 'description' file or, failing that, from gitweb.description.
sub git_get_project_description {
	return git_get_file_or_project_config(shift, 'description');
}
2811
# Category of the project at the given path: taken from its 'category'
# file or, failing that, from gitweb.category.
sub git_get_project_category {
	return git_get_file_or_project_config(shift, 'category');
}
2816
2817
# Return a hash reference mapping the content tags ('ctags') of $project to
# their weights.  Sets $git_dir to the repository of $project.
#
# supported formats:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise (including an empty file) add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
	my $project = shift;
	my $ctags = {};

	$git_dir = "$projectroot/$project";
	if (opendir my $dh, "$git_dir/ctags") {
		my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
		foreach my $tagfile (@files) {
			open my $ct, '<', $tagfile
				or next;
			# only the first line of the file is considered;
			# it is undef for an empty file
			my $val = <$ct>;
			chomp $val if defined $val;
			close $ct;

			# the tag is named after the file
			(my $ctag = $tagfile) =~ s#.*/##;
			if (defined $val && $val =~ /^\d+$/) {
				$ctags->{$ctag} = $val;
			} else {
				$ctags->{$ctag} = 1;
			}
		}
		closedir $dh;

	} elsif (open my $fh, '<', "$git_dir/ctags") {
		while (my $line = <$fh>) {
			chomp $line;
			$ctags->{$line}++ if $line;
		}
		close $fh;

	} else {
		my $taglist = config_to_multi(git_get_project_config('ctag'));
		foreach my $tag (@$taglist) {
			$ctags->{$tag}++;
		}
	}

	return $ctags;
}
2864
# Sum up the content tags ('ctags') of all given projects: returns a hash
# reference whose keys are the tags and whose values are the totals of the
# tag's weight over every project in @$projects.
sub git_gather_all_ctags {
	my ($projects) = @_;
	my %total;

	for my $proj (@$projects) {
		$total{$_} += $proj->{'ctags'}->{$_}
			for keys %{$proj->{'ctags'}};
	}

	return \%total;
}
2879
# Build the tag cloud for the content tags in %$ctags (tag => weight).
# Tags differing only in letter case are merged; the spelling with the
# highest weight is the one displayed.  The tag selected through the 'ctag'
# input parameter is wrapped in <span class="match">.
# Returns an HTML::TagCloud object when that module can be loaded, and
# otherwise a hash reference { <lowercased tag> => { count, ctag } }, where
# 'ctag' is the HTML link for the tag.
sub git_populate_project_tagcloud {
	my ($ctags) = @_;

	# First, merge different-cased tags; tags vote on casing
	my %ctags_lc;
	foreach my $tag (keys %$ctags) {
		my $weight = $ctags->{$tag};
		my $entry  = ($ctags_lc{lc $tag} ||= {});

		$entry->{count} += $weight;
		if (!$entry->{topcount} || $entry->{topcount} < $weight) {
			$entry->{topcount} = $weight;
			$entry->{topname}  = $tag;
		}
	}

	my $matched = $input_params{'ctag'};
	# highlight the title of the currently selected tag
	my $mark_match = sub {
		my ($ctag, $title) = @_;
		return $title unless (defined $matched && $matched eq $ctag);
		return qq(<span class="match">$title</span>);
	};

	my $cloud;
	if (eval { require HTML::TagCloud; 1; }) {
		$cloud = HTML::TagCloud->new;
		foreach my $ctag (sort keys %ctags_lc) {
			# Pad the title with spaces so that the cloud looks
			# less crammed.
			my $title = esc_html($ctags_lc{$ctag}->{topname});
			for ($title) {
				s/ /&nbsp;/g;
				s/^/&nbsp;/g;
				s/$/&nbsp;/g;
			}
			$title = $mark_match->($ctag, $title);
			$cloud->add($title, href(project=>undef, ctag=>$ctag),
			            $ctags_lc{$ctag}->{count});
		}
	} else {
		$cloud = {};
		foreach my $ctag (keys %ctags_lc) {
			my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
			$title = $mark_match->($ctag, $title);
			my $link = $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
			$cloud->{$ctag} = {
				count => $ctags_lc{$ctag}->{count},
				ctag  => $link,
			};
		}
	}
	return $cloud;
}
2925
# Render a tag cloud made by git_populate_project_tagcloud() as HTML.
# An HTML::TagCloud object renders itself via html_and_css($count); for the
# plain-hash form the tags are sorted by ascending count and the first
# $count of them are joined, comma separated, inside <div id="htmltagcloud">
# (centered when no project is selected).
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;

	return $cloud->html_and_css($count)
		if (ref $cloud eq 'HTML::TagCloud');

	my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
	my @shown = splice(@tags, 0, $count);
	my $align = $project ? '' : ' align="center"';

	return '<div id="htmltagcloud"' . $align . '>' .
	       join(', ', map { $cloud->{$_}->{'ctag'} } @shown) .
	       '</div>';
}
2940
# Return the URLs of the project at $path: the lines of its 'cloneurl'
# file or, if that file cannot be opened, the values of the multi-valued
# gitweb.url config variable.  Yields a list in list context and an array
# reference otherwise.  Sets $git_dir to the repository at $path.
sub git_get_project_url_list {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open($fd, '<', "$git_dir/cloneurl")) {
		my $from_config = config_to_multi(git_get_project_config('url'));
		return wantarray ? @{$from_config} : $from_config;
	}

	my @git_project_url_list = <$fd>;
	close $fd;
	chomp @git_project_url_list;

	return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2954
# Return the list of projects as hash references { path => ..., [owner => ...] }.
#
# If $projects_list is a directory, it is scanned (up to $project_maxdepth
# levels deep) for repositories accepted by check_export_ok(); if it is a
# file, the URL-encoded "<path> <owner>" lines are read from it.
# $filter, if given, limits the result to projects below that path prefix.
# With $paranoid set, directory scanning still starts at the top and the
# filter is applied to each candidate path instead of narrowing the
# directory that is searched.
sub git_get_projects_list {
	my $filter = shift || '';
	my $paranoid = shift;
	my @list;

	if (-d $projects_list) {
		# search in directory
		my $dir = $projects_list;
		# remove the trailing "/"
		$dir =~ s!/+$!!;
		my $pfxlen = length("$dir");
		my $pfxdepth = ($dir =~ tr!/!!);
		# when filtering, search only given subdirectory
		if ($filter && !$paranoid) {
			$dir .= "/$filter";
			$dir =~ s!/+$!!;
		}

		File::Find::find({
			follow_fast => 1, # follow symbolic links
			follow_skip => 2, # ignore duplicates
			dangling_symlinks => 0, # ignore dangling symlinks, silently
			wanted => sub {
				# global variables
				our $project_maxdepth;
				our $projectroot;
				# skip project-list toplevel, if we get it.
				return if (m!^[/.]$!);
				# only directories can be git repositories
				return unless (-d $_);
				# don't traverse too deep (Find is super slow on os x)
				# $project_maxdepth excludes depth of $projectroot
				if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
					$File::Find::prune = 1;
					return;
				}

				my $path = substr($File::Find::name, $pfxlen + 1);
				# paranoidly only filter here
				if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
					# leave the callback with 'return': 'next' would
					# exit the subroutine through loop control
					return;
				}
				# we check related file in $projectroot
				if (check_export_ok("$projectroot/$path")) {
					push @list, { path => $path };
					# a repository was found, do not descend into it
					$File::Find::prune = 1;
				}
			},
		}, "$dir");

	} elsif (-f $projects_list) {
		# read from file(url-encoded):
		# 'git%2Fgit.git Linus+Torvalds'
		# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
		# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
		open my $fd, '<', $projects_list or return;
	PROJECT:
		while (my $line = <$fd>) {
			chomp $line;
			my ($path, $owner) = split ' ', $line;
			$path = unescape($path);
			$owner = unescape($owner);
			if (!defined $path) {
				next PROJECT;
			}
			# if $filter is provided, check if $path begins with $filter
			if ($filter && $path !~ m!^\Q$filter\E/!) {
				next PROJECT;
			}
			if (check_export_ok("$projectroot/$path")) {
				my $pr = {
					path => $path
				};
				if ($owner) {
					$pr->{'owner'} = to_utf8($owner);
				}
				push @list, $pr;
			}
		}
		close $fd;
	}
	return @list;
}
3038
# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
3040 # as side effects it sets 'forks' field to list of forks for forked projects
# Takes a reference to a list of project hashes (each with a 'path') and
# returns the projects that are not forks.  A project counts as a fork when
# a leading part of its path (split on '/') equals the path, minus any
# '.git' suffix, of a listed project whose directory of that name exists
# under $projectroot; such a fork is appended to that project's 'forks'.
sub filter_forks_from_projects_list {
        my $projects = shift;

        # Prefix tree over path components.  The '' key of a node is the end
        # marker and holds the project whose path leads to that node.
        my %trie;
        foreach my $pr (@$projects) {
                (my $base = $pr->{'path'}) =~ s/\.git$//; # forks of 'repo.git' are in 'repo/'
                next if $base =~ m!/$!;               # non-bare repository, e.g. 'repo/.git'
                next unless $base;                    # the '.git' repository itself
                next unless -d "$projectroot/$base";  # no directory that could hold forks
                $pr->{'forks'} = [];                  # 0 or more forks get collected here

                my @components = split('/', $base);
                my $node = \%trie;
                # follow the part of the path the trie already knows ...
                my $known = 0;
                while ($known < @components &&
                       exists $node->{$components[$known]}) {
                        $node = $node->{$components[$known]};
                        $known++;
                }
                # ... and grow new nodes for whatever is left
                foreach my $idx ($known .. $#components) {
                        $node = $node->{$components[$idx]} = {};
                }
                # the first project reaching a node owns its end marker
                $node->{''} = $pr unless exists $node->{''};
        }

        # Look every project up in the trie; hitting an end marker on the way
        # down means a shorter path is a project, i.e. this one is its fork.
        my @filtered;
        foreach my $pr (@$projects) {
                my $node = \%trie;
                my $is_fork = 0;
                foreach my $dir (split('/', $pr->{'path'})) {
                        if (exists $node->{''}) {
                                # found [shortest] prefix
                                $is_fork = 1;
                                last;
                        }
                        # not in trie, cannot have prefix
                        last unless exists $node->{$dir};
                        $node = $node->{$dir};
                }
                if ($is_fork) {
                        push @{$node->{''}{'forks'}}, $pr;
                } else {
                        push @filtered, $pr;
                }
        }

        return @filtered;
}
3098
3099 # note: fill_project_list_info must be run first,
3100 # for 'descr_long' and 'ctags' to be filled
# Returns the projects of @$projlist that satisfy the given options:
#   tagfilter     => keep projects having this content tag (case-insensitive)
#   search_regexp => keep projects whose 'path' or 'descr_long' matches
# With neither option set the list is returned unchanged.
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my ($wanted_tag, $pattern) = @opts{'tagfilter', 'search_regexp'};

        if (!$wanted_tag && !$pattern) {
                return @$projlist;
        }

        # make sure the fields examined below have been filled in
        my @fields;
        push @fields, 'ctags'         if $wanted_tag;
        push @fields, 'path', 'descr' if $pattern;
        fill_project_list_info($projlist, @fields);

        my @matching;
        foreach my $pr (@$projlist) {
                if ($wanted_tag) {
                        next if ref($pr->{'ctags'}) ne 'HASH';
                        my $hits = grep { lc($_) eq lc($wanted_tag) } keys %{$pr->{'ctags'}};
                        next if !$hits;
                }

                if ($pattern) {
                        next if $pr->{'path'} !~ /$pattern/ &&
                                $pr->{'descr_long'} !~ /$pattern/;
                }

                push @matching, $pr;
        }

        return @matching;
}
3134
# Cache of owners read from $projects_list, keyed by project path; stays
# undef until git_get_project_list_from_file() has run once.
our $gitweb_project_owner = undef;

# Fills $gitweb_project_owner from the $projects_list file (once; later
# calls return immediately).  If $projects_list is not a plain file or
# cannot be opened the cache is left as an empty hash.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        return unless -f $projects_list;

        # -f does not guarantee readability, so the open itself is checked
        open(my $fd, '<', $projects_list)
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($pr, $ow) = split ' ', $line;
                # blank line: no project path, nothing to record
                next unless defined $pr;
                $pr = unescape($pr);
                $ow = unescape($ow);
                $gitweb_project_owner->{$pr} = to_utf8($ow);
        }
        close $fd;
}
3157
# Returns the owner of $project, or undef if no project is given.
# Sources are tried in order: the $gitweb_project_owner cache (loaded on
# first use), the project's 'owner' config value, then get_file_owner()
# on the repository directory.  Sets the global $git_dir as a side effect.
sub git_get_project_owner {
        my $project = shift;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        git_get_project_list_from_file()
                unless defined $gitweb_project_owner;

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if exists $gitweb_project_owner->{$project};
        $owner = git_get_project_config('owner')
                unless defined $owner;
        $owner = get_file_owner("$git_dir")
                unless defined $owner;

        return $owner;
}
3181
# Returns (age in seconds, age string) for the most recently committed
# ref under refs/heads of the project at $path, (undef, undef) when the
# committer line cannot be parsed, and nothing when the command cannot be
# started or its close fails.  Sets the global $git_dir as a side effect.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   'refs/heads');
        open(my $fd, "-|", @cmd) or return;
        my $most_recent = <$fd>;
        close $fd or return;

        return (undef, undef)
                unless defined $most_recent;
        # the number in front of the trailing timezone is the commit time
        return (undef, undef)
                unless $most_recent =~ / (\d+) [-+][01]\d\d\d$/;

        my $age = time - $1;
        return ($age, age_string($age));
}
3202
3203 # Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote URL
3205 # if it's not defined), and we cannot use 'git remote show' because that would
3206 # try to make a network roundtrip. So the only way to find if that particular
3207 # remote is defined is to walk the list provided by 'git remote -v' and stop if
3208 # and when we find what we want.
# Parses the output of 'git remote -v' into a hash keyed by remote name.
# Each value is a hash with a 'heads' slot (undef until filled elsewhere)
# plus one entry per "(<kind>)" suffix seen for that remote, mapping the
# kind to its URL.  If $wanted is given only that remote is collected.
# Returns the hash in list context, a reference to it in scalar context,
# and nothing if the command cannot be started or its close fails.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # check open's own result: $fd is not a reliable failure indicator
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # "<name>\t<url> (<kind>)": cut everything after the name;
                # skip lines of any other shape instead of reusing old captures
                $remote =~ s!\t(.*?)\s+\((\w+)\)$!!
                        or next;
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # explicit undef: an empty list here would give the hash
                # constructor an odd number of elements
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3227
3228 # Takes a hash of remotes as first parameter and fills it by adding the
3229 # available remote heads for each of the indicated remotes.
# Sets $remotes->{<name>}{'heads'} for every remote in %$remotes to the
# list of head entries (as returned by git_get_heads_list) belonging to
# that remote.  The "<name>/" prefix is removed from each entry's 'name'
# in the process.
sub fill_remote_heads {
        my $remotes = shift;

        # without class names git_get_heads_list falls back to local heads,
        # which would be listed for nothing
        return unless %$remotes;

        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # \Q..\E: the remote name is literal text, not a pattern
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3240
# Returns a reference to a hash mapping object id to the list of ref names
# (without the leading 'refs/') reported for it by 'git show-ref
# --dereference'.  With $type given only refs under "refs/$type" are
# requested.  Returns nothing if the command cannot be started or its
# close fails.
sub git_get_references {
        my $type = shift || "";
        my %refs;
        # use -- <pattern> if $type
        my @pattern = $type ? ("--", "refs/$type") : ();
        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
                # the list for a new id springs into existence on first push
                push @{$refs{$1}}, $2;
        }
        close $fd or return;
        return \%refs;
}
3263
# Returns the tag-based name that 'git name-rev --tags' prints for $hash
# (the part after "tags/"), or undef when $hash is empty, the command
# prints nothing, or the output has another form.  Returns nothing if the
# command cannot be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # the command printed nothing at all
        return undef unless defined $name_rev;

        # \Q..\E: $hash is matched as literal text, not as a pattern
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
3279
3280 ## ----------------------------------------------------------------------
3281 ## parse to hash functions
3282
# Breaks $epoch (seconds since the epoch) into a hash of date fields.
# $tz is a "+HHMM"/"-HHMM" offset and defaults to "-0000".
# UTC fields:   hour, minute, mday, day, month, rfc2822, mday-time, iso-8601
# Local fields: hour_local, minute_local, tz_local, iso-tz
# A $tz of any other form is treated as a zero offset for the local
# fields; it is still reported verbatim in 'tz_local' and 'iso-tz'.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # offset of the given timezone in seconds; only computed when $tz
        # has the expected form, so no arithmetic is done on undef parts
        my $offset = 0;
        if (my ($tz_sign, $tz_hour, $tz_min) =
                ($tz =~ m/^([-+])(\d\d)(\d\d)$/)) {
                $offset = ($tz_sign eq '-' ? -1 : +1) *
                          ((($tz_hour*60) + $tz_min)*60);
        }
        my $local = $epoch + $offset;
        # shifting the epoch and reading it as UTC yields local wall time
        ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3316
# Parses the tag object $tag_id as printed by 'git cat-file tag'.
# Returns a hash with 'id', the header fields found ('object', 'type',
# 'name', 'author', 'author_epoch', 'author_tz', 'author_name' and, when
# present, 'author_email') and 'comment' (reference to the list of message
# lines).  Returns nothing if the command cannot be started, its close
# fails, or the object has no 'tag' line.
sub parse_tag {
        my $tag_id = shift;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;

        my %tag = ('id' => $tag_id);
        my @comment;
        # header: stops at the first empty line or at a '--BEGIN' line,
        # the latter being kept as first line of the comment
        while (my $line = <$fd>) {
                chomp $line;
                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                        next;
                }
                if ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                        next;
                }
                if ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                        next;
                }
                if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        if (my ($name, $email) = $tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $tag{'author_name'}  = $name;
                                $tag{'author_email'} = $email;
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                        next;
                }
                if ($line =~ m/--BEGIN/) {
                        push @comment, $line;
                        last;
                }
                last if $line eq "";
        }
        # everything left is the message
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag
}
3357
# Parses the text of a single commit record into a hash.
#
# $commit_text is one record: a header line starting with the commit id
# (optionally followed by parent ids), the 'tree'/'parent'/'author'/
# 'committer' lines, and then the commit message.
# $withparents: when defined, parents are taken only from the header line
# and 'parent' lines are ignored; otherwise 'parent' lines are collected.
#
# Returns a hash with id, tree, parents (array ref), parent (first parent),
# author*/committer* fields, title, title_short, comment (array ref of
# message lines) and age/age_string* fields.  Returns nothing when the
# record is empty, the header line does not start with an object id, or no
# 'tree' line was found.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        # first word of the header is the commit id, the rest are parent ids
        ($co{'id'}, my @parents) = split ' ', $header;
        # consume header lines; the loop condition is false for an empty
        # line, so it ends at the first empty line, which is consumed too
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        # split "Name <email>"; without that form the whole
                        # string is used as the name and no email is set
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # the title is the first non-empty message line; $title aliases the
        # element of @commit_lines, so the edits below change that line too
        foreach my $title (@commit_lines) {
                $title =~ s/^    //;
                if ($title ne "") {
                        $co{'title'} = chop_str($title, 80, 5);
                        # remove leading stuff of merges to make the interesting part visible
                        # (each step is applied only while the title is still over 50 chars)
                        if (length($title) > 50) {
                                $title =~ s/^Automatic //;
                                $title =~ s/^merge (of|with) /Merge ... /i;
                                if (length($title) > 50) {
                                        $title =~ s/(http|rsync):\/\///;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/(master|www|rsync)\.//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/kernel.org:?//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/\/pub\/scm//;
                                }
                        }
                        $co{'title_short'} = chop_str($title, 50, 5);
                        last;
                }
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        # commits older than two weeks get the calendar date in
        # 'age_string_date' and the relative age in 'age_string_age';
        # for newer commits the two are swapped
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        }
        return %co;
}
3455
# Returns the parsed commit $commit_id as a hash (see parse_commit_text),
# with parents taken from the 'git rev-list --parents' header line.
# The hash is empty when rev-list prints nothing or the text cannot be
# parsed.  Calls die_error(500) if the command cannot be started.
sub parse_commit {
        my ($commit_id) = @_;
        my %co;

        # rev-list --header records are terminated by NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--",
                or die_error(500, "Open git-rev-list failed");
        # read in scalar context: inside an argument list <$fd> would be
        # evaluated in list context, and with no output the following flag
        # would slide into the place of the commit text
        my $commit_text = <$fd>;
        close $fd;

        %co = parse_commit_text($commit_text, 1)
                if defined $commit_text;

        return %co;
}
3474
# Runs 'git rev-list --header' starting at $commit_id and returns the
# parsed commits (one hash reference per record, see parse_commit_text)
# as a list, or as an array reference in scalar context.
#   $maxcount - number of commits to list (defaults to 1)
#   $skip     - number of commits to skip first (defaults to 0)
#   $filename - optional path limiter
#   @args     - extra rev-list options placed before the counts
# Calls die_error(500) if the command cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount ||= 1;
        $skip ||= 0;

        # rev-list --header records are terminated by NUL
        local $/ = "\0";

        my @rev_list = (git_cmd(), "rev-list",
                        "--header",
                        @args,
                        "--max-count=$maxcount",
                        "--skip=$skip",
                        @extra_options,
                        $commit_id,
                        "--");
        push @rev_list, $filename if $filename;

        open my $fd, "-|", @rev_list
                or die_error(500, "Open git-rev-list failed");
        my @cos;
        while (my $record = <$fd>) {
                push @cos, +{ parse_commit_text($record) };
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3502
3503 # parse line of git-diff-tree "raw" output
# Recognizes three kinds of lines and returns the parsed fields as a hash
# (list context) or hash reference (scalar context); the hash is empty for
# any other line.
#  - ordinary raw diff line: from_mode, to_mode, from_id, to_id, status,
#    similarity, from_file, to_file (and 'file' unless renamed or copied)
#  - combined diff line: nparents, from_mode/from_id/status (array refs),
#    to_mode, to_id, to_file
#  - bare 40-digit object id: commit
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                @res{'from_mode', 'to_mode', 'from_id', 'to_id', 'status', 'similarity'} =
                        ($1, $2, $3, $4, $5, $6);
                my $paths = $7;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') {
                        # renamed or copied: two tab-separated names
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $paths);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($paths);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
                my ($colons, $modes, $ids, $status, $file) = ($1, $2, $3, $4, $5);
                # the last mode and the last id belong to the result
                my @modes = split(' ', $modes);
                my @ids   = split(' ', $ids);
                $res{'nparents'}  = length($colons);
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $status) ];
                $res{'to_file'}   = unquote($file);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3541
3542 # wrapper: return parsed line of git-diff-tree "raw" output
3543 # (the argument might be raw line, or parsed info)
# Accepts either a hash reference or a raw git-diff-tree line; a hash
# reference is returned as is, anything else goes through
# parse_difftree_raw_line().
sub parsed_difftree_line {
        my $line_or_ref = shift;

        # pre-parsed (or generated by hand)
        return $line_or_ref
                if ref($line_or_ref) eq "HASH";

        return parse_difftree_raw_line($line_or_ref);
}
3554
3555 # parse line of git-ls-tree output
# Parses one line of git-ls-tree output.
# Options (key => value pairs after the line):
#   -l => true: the line carries a size column ('-' or a number)
#   -z => true: the name is taken verbatim instead of going through
#               unquote()
# Returns a hash (list context) or hash reference (scalar context) with
# mode, type, hash, name and, with -l, size.  A line that does not have
# the expected form yields an empty hash.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        # captures are copied only after a successful match, so a malformed
        # line cannot pick up values left over from an earlier match
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s) {
                        @res{'mode', 'type', 'hash', 'size', 'name'} =
                                ($1, $2, $3, $4, $5);
                }
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s) {
                        @res{'mode', 'type', 'hash', 'name'} =
                                ($1, $2, $3, $4);
                }
        }

        if (exists $res{'name'} && !$opts{'-z'}) {
                $res{'name'} = unquote($res{'name'});
        }

        return wantarray ? %res : \%res;
}
3590
3591 # generates _two_ hashes, references to which are passed as 2 and 3 argument
# Fills the hashes referenced by $from and $to with 'file' and 'href'
# entries derived from $diffinfo.  For a combined diff ('nparents' set)
# $from->{'file'} and $from->{'href'} are arrays with one slot per parent
# and @parents supplies the hash_base of each link; otherwise they are
# plain scalars and the global $hash_parent is used.  'href' is
# undef/absent for added files (from side) and deleted files (to side).
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if (!$diffinfo->{'nparents'}) {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") { # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        } else {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the resulting name when a parent has none
                        my $parent_file = $diffinfo->{'from_file'}[$i];
                        $from->{'file'}[$i] = defined $parent_file
                                ? $parent_file
                                : $diffinfo->{'to_file'};
                        # no link for a parent in which the file was added
                        $from->{'href'}[$i] = $diffinfo->{'status'}[$i] ne "A"
                                ? href(action=>"blob",
                                       hash_base=>$parents[$i],
                                       hash=>$diffinfo->{'from_id'}[$i],
                                       file_name=>$from->{'file'}[$i])
                                : undef;
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) {
                delete $to->{'href'};
        } else { # file exists in result
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3636
3637 ## ......................................................................
3638 ## parse to array of hashes functions
3639
# Lists refs under "refs/<class>" for each of @classes (default: 'heads'),
# sorted by committer date, newest first.  With $limit set, git is asked
# for $limit+1 entries.  Each entry is a hash reference with fullname,
# name, id, title, epoch and age.  Returns the list, or an array reference
# in scalar context; nothing if the command cannot be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @count = $limit ? ('--count='.($limit+1)) : ();
        my @headslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count, '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # a NUL separates the ref description from the committer info
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $name, $title) = split(' ', $refinfo, 3);
                my ($committer, $epoch, $tz) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

                (my $short_name = $name) =~ s!^refs/(?:head|remote)s/!!;
                my $age = $epoch ? age_string(time - $epoch) : "unknown";

                push @headslist, {
                        'fullname' => $name,
                        'name'     => $short_name,
                        'id'       => $hash,
                        'title'    => $title || '(no commit message)',
                        'epoch'    => $epoch,
                        'age'      => $age,
                };
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3678
# Lists refs under refs/tags sorted by creator date, newest first.  With
# $limit set, git is asked for $limit+1 entries.  Each entry is a hash
# reference with fullname, type, id, name, reftype and refid; tag objects
# also get 'subject', and tags/commits get 'epoch' and 'age'.  Returns the
# list, or an array reference in scalar context; nothing if the command
# cannot be started.
sub git_get_tags_list {
        my $limit = shift;
        my @count = $limit ? ('--count='.($limit+1)) : ();
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count, '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # a NUL separates the ref description from the creator info
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my ($creator, $epoch, $tz) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);

                my %ref_item = (
                        'fullname' => $name,
                        'type'     => $type,
                        'id'       => $id,
                );
                $name =~ s!^refs/tags/!!;
                $ref_item{'name'} = $name;

                my $is_tag_object = ($type eq "tag");
                if ($is_tag_object) {
                        # tag object: report what it points at
                        @ref_item{'subject', 'reftype', 'refid'} =
                                ($title, $reftype, $refid);
                } else {
                        # otherwise the ref refers to the object itself
                        @ref_item{'reftype', 'refid'} = ($type, $id);
                }

                if ($is_tag_object || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'} = $epoch
                                ? age_string(time - $epoch)
                                : "unknown";
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3727
3728 ## ----------------------------------------------------------------------
3729 ## filesystem-related functions
3730
# Returns the owner of $path: the GECOS field of the passwd entry of the
# file's uid, cut at the first ',' or ';' and passed through to_utf8().
# Returns undef when $path cannot be stat'ed or the uid has no passwd
# entry / GECOS field.
sub get_file_owner {
        my $path = shift;

        # stat returns an empty list on failure; without this check the
        # undefined uid would be looked up as uid 0
        my $st_uid = (stat($path))[4];
        if (!defined $st_uid) {
                return undef;
        }

        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3743
3744 # assume that file exists
# Prints the contents of $filename, each line passed through to_utf8().
# Callers are expected to pass an existing file; if it nevertheless cannot
# be opened nothing is printed.
sub insert_file {
        my $filename = shift;

        # do not read from a handle that failed to open
        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3752
3753 ## ......................................................................
3754 ## mimetype related functions
3755
# Looks up the extension of $filename (the text after its last '.') in the
# mime.types style file $mimemap, whose lines have the form
# "<mimetype> <ext> <ext> ..." ('#' lines are comments).  When an
# extension is listed more than once the last listing wins.
# Returns the mimetype, or undef when $mimemap is not readable, $filename
# has no '.', or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # take the extension from this match only; without a successful
        # match $1 would still hold the capture of some earlier regexp
        $filename =~ /\.([^.]*)$/ or return undef;
        my $wanted_ext = $1;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # a lexical line variable keeps the caller's $_ intact
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, @exts) = split(/\s+/, $line);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        return $mimemap{$wanted_ext};
}
3775
# Guesses the mimetype of $filename from its extension, consulting
# $mimetypes_file first (when set) and '/etc/mime.types' second.
# Returns undef when $filename contains no '.' or no file knows the
# extension.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # a relative path is relative to the project
                my $file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime ||= mimetype_guess_file($filename, '/etc/mime.types');
        return $mime;
}
3792
# Work out a MIME type for a blob given its open handle $fd and, optionally,
# its $filename.
# Order of precedence: a non-empty answer from mimetype_guess($filename),
# then $default_blob_plain_mimetype when no handle was given, then
# 'text/plain' when the -T test on the handle succeeds, then a few image
# types recognised by file name suffix, and finally
# 'application/octet-stream'.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $guessed = mimetype_guess($filename);
                return $guessed if $guessed;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;

        if ($filename) {
                return 'image/png'  if $filename =~ m/\.png$/i;
                return 'image/gif'  if $filename =~ m/\.gif$/i;
                return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
        }
        return 'application/octet-stream';
}
3819
# Return the Content-Type value for a blob.
# $type is used when given, otherwise blob_mimetype($fd, $file_name) is
# asked.  For 'text/plain' the charset from $default_text_plain_charset is
# appended when that variable is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);
        return $type . "; charset=$default_text_plain_charset";
}
3830
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Parameters: $highlight (highlighting is considered only when true),
# $mimetype (accepted but not used here) and $file_name.
# A trailing '.in' is stripped from the base name first.  The whole base
# name is looked up in %highlight_basename, then the text after its last
# '.' in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # Capture the extension from this match only; $1 would still hold a
        # value from an earlier successful match if this one failed.
        my ($ext) = $basename =~ /\.([^.]*)$/
                or return undef;
        # as before, an empty or otherwise false extension means "no syntax"
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3847
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# When highlighting applies, $fd is closed and reopened as a read pipe from
# a shell pipeline: "git cat-file blob $hash" fed into $highlight_bin.
# Note that the blob is identified by the global $hash, not by an argument.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        return $fd if (!$highlight || !defined $syntax);

        close $fd;
        my $pipeline =
                quote_command(git_cmd(), "cat-file", "blob", $hash) .
                " | " .
                quote_command($highlight_bin) .
                " --replace-tabs=8 --fragment --syntax $syntax |";
        open $fd, $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3861
3862 ## ======================================================================
3863 ## functions printing HTML: header, footer, error page
3864
# Build the page title from the site name and, as far as they are defined,
# the project filter or the project, action and file name.
sub get_page_title {
        my $title = to_utf8($site_name);

        # no project: optionally mention the project filter and stop
        if (!defined $project) {
                $title .= " - projects in '" . esc_path($project_filter) . "'"
                        if defined $project_filter;
                return $title;
        }

        $title .= " - " . to_utf8($project);
        return $title if !defined $action;

        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)
        return $title if !defined $file_name;

        $title .= " - " . esc_path($file_name);
        # in tree view make sure the path ends with a slash
        $title .= "/"
                if ($action eq "tree" && $file_name !~ m|/$|);

        return $title;
}
3887
# Choose the content type for HTML pages.
# 'application/xhtml+xml' is sent only to user agents that list it
# explicitly in their Accept header; everybody else gets plain old
# 'text/html'.  The explicit check is needed because MSIE sometimes globs
# '*/*', pretending to support xhtml+xml but choking when it gets what it
# asked for.
sub get_content_type_html {
        my $accept = $cgi->http('HTTP_ACCEPT');

        my $wants_xhtml =
                defined $accept &&
                $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
                $cgi->Accept('application/xhtml+xml') != 0;

        return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3901
# Print the <link rel="alternate"> elements for the page head.
# With a project: for each of RSS and Atom one link built from
# get_feed_info() and a second one with extra_options '--no-merges'.
# Without a project: links to the 'project_index' and 'opml' actions.
sub print_feed_meta {
        if (!defined $project) {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
                return;
        }

        my %href_params = get_feed_info();
        $href_params{'-title'} = 'log'
                unless exists $href_params{'-title'};

        foreach my $format (qw(RSS Atom)) {
                my $type = lc($format);
                my $rel = 'alternate';
                my $title = esc_attr("$project - $href_params{'-title'} - $format feed");
                my $mime = "application/$type+xml";

                $href_params{'action'} = $type;
                # first the plain feed, then the variant without merges
                foreach my $variant ([undef, ''], ['--no-merges', ' (no merges)']) {
                        my ($extra_options, $title_suffix) = @$variant;
                        $href_params{'extra_options'} = $extra_options;
                        my $href = href(%href_params);
                        print "<link ".
                              "rel=\"$rel\" ".
                              "title=\"$title$title_suffix\" ".
                              "href=\"$href\" ".
                              "type=\"$mime\" ".
                              "/>\n";
                }
        }
}
3947
# Print the <link> elements of the page head: stylesheets, feed links (only
# when $status is '200 OK') and the favicon if one is configured.
sub print_header_links {
        my $status = shift;

        # A $stylesheet defined in a config file wins over @stylesheets; this
        # keeps older configurations working.  Empty entries of @stylesheets
        # are skipped.
        my @sheets = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $sheet (@sheets) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n)
                if defined $favicon;
}
3967
# Print one breadcrumb link per path component passed in, each followed by
# " / ".  Every link goes to the project_list action with project_filter set
# to the path accumulated so far.
sub print_nav_breadcrumbs_path {
        my $dirprefix = undef;
        # Iterate over the argument list itself rather than testing each
        # shifted value for truth: a component named "0" is a valid directory
        # name and must not end the breadcrumb trail.  Empty components (from
        # doubled or leading slashes) are skipped.
        foreach my $part (@_) {
                next unless defined $part && $part ne '';
                $dirprefix .= "/" if defined $dirprefix;
                $dirprefix .= $part;
                print $cgi->a({-href => href(project => undef,
                                             project_filter => $dirprefix,
                                             action => "project_list")},
                              esc_html($part)) . " / ";
        }
}
3979
# Print the breadcrumb line: home link, then either the project path with
# the current action (and the optional -action_extra text), or the
# components of $project_filter when no project is selected.
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $action_extra = $opts{-action_extra};

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";

        if (!defined $project) {
                print_nav_breadcrumbs_path(split '/', $project_filter)
                        if defined $project_filter;
                return;
        }

        my @dirname = split '/', $project;
        my $projectbasename = pop @dirname;
        print_nav_breadcrumbs_path(@dirname);
        print $cgi->a({-href => href(action=>"summary")}, esc_html($projectbasename));

        if (defined $action) {
                # the action becomes a link only when extra text follows it
                my $action_print = defined $action_extra
                        ? $cgi->a({-href => href(action=>$action)}, $action)
                        : $action;
                print " / $action_print";
        }
        print " / $action_extra" if defined $action_extra;
        print "\n";
}
4005
# Print the search form shown in the page header.
# The form submits with GET to $my_uri (with the project appended when the
# 'pathinfo' feature is on, otherwise the project travels in a hidden "p"
# field) and carries the search type menu, the search text and the "re"
# checkbox.  The hash searched from is $hash_base, else $hash, else "HEAD".
# Side effect: an undefined global $searchtext is set to "".
sub print_search_form {
        if (!defined $searchtext) {
                $searchtext = "";
        }
        my $search_hash;
        if (defined $hash_base) {
                $search_hash = $hash_base;
        } elsif (defined $hash) {
                $search_hash = $hash;
        } else {
                $search_hash = "HEAD";
        }
        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if ($use_pathinfo) {
                $action .= "/".esc_url($project);
        }
        # start_form is the documented name and pairs with the end_form call
        # below; the old 'startform' spelling is a legacy alias that, to my
        # knowledge, newer CGI.pm releases no longer provide.
        # The whole form is one concatenated string (the original had a
        # stray ',' in the middle of the chain).
        print $cgi->start_form(-method => "get", -action => $action) .
              "<div class=\"search\">\n" .
              (!$use_pathinfo &&
              $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
              $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
              $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
              $cgi->popup_menu(-name => 'st', -default => 'commit',
                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
              $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
              " search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>" .
              "</div>" .
              $cgi->end_form() . "\n";
}
4041
# Print the HTTP header (unless -no_http_header is given) and the top of the
# HTML page: document head, optional site header file, logo, breadcrumbs and,
# for project pages with the 'search' feature enabled, the search form.
# Parameters: $status (defaults to "200 OK"), $expires, then options; the
# options are also handed on to print_nav_breadcrumbs().
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }
        my $mod_perl_version = '';
        $mod_perl_version = " $ENV{'MOD_PERL'}" if $ENV{'MOD_PERL'};
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # with path_info in play the relative stylesheet, favicon etc. URLs
        # only resolve correctly against an explicit base URL
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n" .
              "<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                my $logo_img = $cgi->img({-src => esc_url($logo),
                                          -width => 72, -height => 27,
                                          -alt => "git",
                                          -class => "logo"});
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $logo_img);
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $have_search);
}
4100
# Print the bottom of the HTML page: the footer div with the project
# description and feed links (or OPML/TXT links when no project is
# selected), the optional timing information, the optional site footer file,
# the JavaScript includes and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (defined $project) {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                # no feed parameters at all: mark the links as generic
                $feed_class .= ' generic' unless %href_params;
                $href_params{'-title'} = 'log' unless $href_params{'-title'};

                foreach my $format ('RSS', 'Atom') {
                        $href_params{'action'} = lc($format);
                        my $feed_link = $cgi->a({-href => href(%href_params),
                                                 -title => "$href_params{'-title'} $format feed",
                                                 -class => $feed_class}, $format);
                        print $feed_link."\n";
                }

        } else {
                my $opml_link = $cgi->a({-href => href(project=>undef, action=>"opml",
                                                       project_filter => $project_filter),
                                         -class => $feed_class}, "OPML");
                print $opml_link . " ";
                my $txt_link = $cgi->a({-href => href(project=>undef, action=>"project_index",
                                                      project_filter => $project_filter),
                                        -class => $feed_class}, "TXT");
                print $txt_link . "\n";
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                my $elapsed = tv_interval($t0, [ gettimeofday() ]);
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      $elapsed.
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        if (defined $action &&
            $action eq 'blame_incremental') {
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                # collect the statements of the onload handler first
                my @onload;
                if (gitweb_check_feature('javascript-actions')) {
                        push @onload, qq!       fixLinks();\n!;
                }
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        push @onload,
                              qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!, # in days
                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }

                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!.
                      join('', @onload).
                      qq!};\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4179
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# The error message is HTML-escaped; the detailed description is printed
# as-is.  Any further arguments are options: they are handed to
# git_header_html(), and '-error_handler' suppresses the final jump to
# DONE_GITWEB.  A status code outside the list above is sent with the
# "500 Internal Server Error" status line; the page body still shows the
# code that was passed in.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # Never hand an undefined status to git_header_html(): it would be
        # replaced by the default "200 OK" and the error page would be served
        # as a success.
        my $http_status = $http_responses{$status} || $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4223
4224 ## ----------------------------------------------------------------------
4225 ## functions printing or outputting HTML: navigation
4226
# Print the page navigation bar: the standard views separated by " | ", with
# the current one as plain text, followed by $extra on a line of its own.
# Parameters: $current view name, $suppress (a view to leave out), $head
# (hash for the commit-related links), $treehead and $treebase (hash and
# hash_base for the tree link), $extra (pager or formats, defaults to '').
# Entries from the 'actions' feature are inserted after the view named as
# their position, with %n, %f, %h, %b and %% expanded in their link.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                qw(summary shortlog log commit commitdiff tree);

        my %arg;
        $arg{$_} = { action => $_ } foreach @navs;
        if (defined $head) {
                $arg{$_}{'hash'} = $head foreach qw(commit commitdiff);
                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
                        $arg{$_}{'hash'} = $head foreach qw(shortlog log);
                }
        }

        if (defined $treehead) {
                $arg{'tree'}{'hash'} = $treehead;
        }
        if (defined $treebase) {
                $arg{'tree'}{'hash_base'} = $treebase;
        }

        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        # the feature value is a flat list of (label, link, position) triples
        while (@actions) {
                my ($label, $link, $pos) = splice(@actions,0,3);
                # put the label right after every entry equal to $pos
                my @with_label;
                foreach my $nav (@navs) {
                        push @with_label, $nav;
                        push @with_label, $label if $nav eq $pos;
                }
                @navs = @with_label;
                # expand the %-placeholders
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @entries;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @entries, $nav;
                        next;
                }
                push @entries,
                        $cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav");
        }

        print "<div class=\"page_nav\">\n" .
                join(" | ", @entries);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4276
# returns a submenu for the navigation of the refs views (tags, heads,
# remotes): entries are joined with " | ", the current view is plain text
# and the others are links; the remotes view is offered only if the
# 'remote_heads' feature is enabled
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @entries;
        foreach my $view (@ref_views) {
                if ($view eq $current) {
                        push @entries, $view;
                } else {
                        push @entries, $cgi->a({-href => href(action=>$view)}, $view);
                }
        }
        return join(" | ", @entries);
}
4289
# Return the "first . prev . next" pager as an HTML string.
# "first" and "prev" are links when $page is greater than 0, "next" is a
# link when $has_next_link is true; otherwise the words appear as plain
# text.  The $action argument is accepted but not used.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my $back = "first &sdot; prev";
        if ($page > 0) {
                my $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                my $prev = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                    -accesskey => "p", -title => "Alt-p"}, "prev");
                $back = $first . " &sdot; " . $prev;
        }

        my $forward = "next";
        if ($has_next_link) {
                $forward = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                    -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return $back . " &sdot; " . $forward;
}
4315
4316 ## ......................................................................
4317 ## functions printing or outputting HTML: div
4318
# Print a <div class="header"> holding one link of class "title".
# The link goes to $action, with hash and hash_base added when $hash and
# $hash_base are true; its text is $title, or $action when $title is false.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        if ($hash) {
                $args{'hash'} = $hash;
        }
        if ($hash_base) {
                $args{'hash_base'} = $hash_base;
        }

        my $label = $title ? $title : $action;
        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
4332
# Return one table row of class "metadata_url" with $name in the first cell
# and $url in the second.  Both values are inserted as given.
sub format_repo_url {
        my ($name, $url) = @_;

        my $cells = "<td>$name</td><td>$url</td>";
        return "<tr class=\"metadata_url\">" . $cells . "</tr>\n";
}
4337
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, an IO handle passed either as *handle or
# *handle{IO} (or as a reference to a glob, including a blessed one), or a
# function reference. In the latter case all following
# parameters will be taken as argument to the content function call.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        # Recognise handles by their underlying type rather than by class
        # name: *handle{IO} is blessed into IO::File on perl >= 5.12, so a
        # comparison with 'IO::Handle' does not match there, and a bare
        # *handle is not a reference at all.
        require Scalar::Util;
        my $reftype = Scalar::Util::reftype($content);
        $reftype = '' unless defined $reftype;
        my $is_handle = $reftype eq 'GLOB' || $reftype eq 'IO' ||
                        ref(\$content) eq 'GLOB';

        if (ref($content) eq 'CODE') {
                $content->(@_);
        } elsif (ref($content) eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                print <$content>;
        } elsif (!ref($content) && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4375
# Return the HTML for a timestamp: the 'rfc2822' field of the date hash
# $date, followed by the local time and timezone in parentheses.
# The rfc2822 text is wrapped in a <span> when the third value of the
# 'javascript-timezone' feature (a class name) is set, and a local hour
# before 6 is marked with the "atnight" class.
sub format_timestamp_html {
        my $date = shift;

        my $datetime_class = (gitweb_get_feature('javascript-timezone'))[2];
        my $strtime = $datetime_class
                ? qq!<span class="$datetime_class">$date->{'rfc2822'}</span>!
                : $date->{'rfc2822'};

        my $localtime_format = ($date->{'hour_local'} < 6)
                ? '(<span class="atnight">%02d:%02d</span> %s)'
                : '(%02d:%02d %s)';
        my $localtime = sprintf($localtime_format,
                                @{$date}{qw(hour_local minute_local tz_local)});

        return $strtime . ' ' . $localtime;
}
4396
# Outputs the author name and date in long form
# Takes the commit hash reference $co followed by options; the element
# named by the -tag option ('div' by default) wraps the author search link,
# the timestamp in brackets and the avatar.
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
        my $author_link = format_search_author($author, "author", esc_html($author));
        my $when = format_timestamp_html(\%ad);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $author_link .
              " [".$when."]".
              $avatar .
              "</$tag>\n";
}
4411
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for. If the list is empty it defaults to both
# author and committer.
# Each person takes two rows: name and e-mail search links plus a
# double-size avatar spanning both rows, then the timestamp.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') if !@people;

        for my $who (@people) {
                my $name = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_link = format_search_author($name, $who, esc_html($name));
                my $email_link = format_search_author($email, $who,
                                                      esc_html("<" . $email . ">"));
                my $avatar = git_get_avatar($email, -size => 'double');
                my $when = format_timestamp_html(\%wd);

                print "<tr><td>$who</td><td>" .
                      $name_link . " " .
                      $email_link .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" .
                      $when .
                      "</td>" .
                      "</tr>\n";
        }
}
4439
# Print the <div class="page_path"> line: a link to the tree root labelled
# "[$project]", then one 'tree' link per leading directory of $name, then
# the last component.
# Parameters: $name (path, may be undef), $type ('blob' links the last
# component to blob_plain, 'tree' links it to tree and appends " / ", any
# other value prints it as text) and $hb (hash base used in every link).
sub git_print_page_path {
        my ($name, $type, $hb) = @_;

        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth, of the prefix: a
                        # leading directory named "0" is false but still needs
                        # its separator
                        $fullname .= (length($fullname) ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # Link to the path that was passed in (it is also what the
                # title shows) instead of reading the global $file_name.
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4477
# Print the lines of a commit message as HTML, one "<br/>"-terminated line
# each.
# $log is a reference to the array of lines.  Options:
#   -remove_title     drop the first line before printing
#   -remove_signoff   leave out signed-off-by/acked-by/cc lines
#   -final_empty_line end the output with a single empty line
# Runs of empty lines are collapsed to one, and empty lines directly after a
# signoff line are not printed.
# Note: the title and leading empty lines are shifted off the caller's array.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $after_signoff = 0; # only signoff and empty lines seen since a signoff
        my $empty = 0;         # last line handled was a printed empty line
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $after_signoff = 1;
                        $empty = 0;
                        print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n"
                                unless $opts{'-remove_signoff'};
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $after_signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                        # The flag is cleared only by real text.  Clearing it
                        # before the test above (as was done before) meant the
                        # empty line after a signoff was always printed.
                        $after_signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4526
# Return the target of a symbolic link (what the link points to).
#
# $hash is the id of the blob object that stores the link; its whole
# contents, as printed by "git cat-file blob", is the target.
# Returns nothing (undef in scalar context) when the command cannot be
# started or when closing the pipe reports a failure.
sub git_get_link_target {
	my ($hash) = @_;

	unless (open(my $pipe, "-|", git_cmd(), "cat-file", "blob", $hash)) {
		return;
	}

	# slurp everything the command printed in one read
	my $contents = do { local $/ = undef; <$pipe> };

	return unless close($pipe);
	return $contents;
}
4544
# Given a symlink target and the directory the link lives in, return the
# target as a path relative to the top (root) tree.
#
# Parameters:
#   $link_target - contents of the symlink
#   $basedir     - directory containing the link, relative to the top tree;
#                  undef or '' means the link is in the top tree itself
#
# Returns the normalized path ('//', '/./' and '/../' are resolved), or
# nothing (undef in scalar context) when the target cannot be expressed that
# way: absolute targets and targets that lead outside the top tree.
sub normalize_link_target {
	my ($link_target, $basedir) = @_;

	# absolute symlinks (beginning with '/') cannot be normalized
	return if (substr($link_target, 0, 1) eq '/');

	# normalize link target to path from top (root) tree (dir);
	# compare against '' explicitly: a directory named "0" is a valid basedir
	my $path;
	if (defined $basedir && $basedir ne '') {
		$path = $basedir . '/' . $link_target;
	} else {
		# we are in top (root) tree (dir)
		$path = $link_target;
	}

	# remove //, /./, and /../
	my @path_parts;
	foreach my $part (split('/', $path)) {
		# discard '.' and ''; do not test truthiness here, because a path
		# component named "0" is false in Perl yet perfectly valid
		next if ($part eq '' || $part eq '.');
		# handle '..'
		if ($part eq '..') {
			# link leads outside repository (outside top dir)
			return unless @path_parts;
			pop @path_parts;
		} else {
			push @path_parts, $part;
		}
	}

	return join('/', @path_parts);
}
4584
# Print one tree entry (a row of git_tree) as a sequence of <td> cells,
# but without the encompassing <tr> element.
#
# Parameters:
#   $t          - hashref describing the entry; the keys read here are
#                 'mode', 'type', 'hash', 'name' and, optionally, 'size'
#   $basedir    - path prefix prepended verbatim to the entry name to build
#                 the file_name parameter of generated links
#   $hash_base  - commit the tree belongs to; may be undef, in which case
#                 no "history" links are printed
#   $have_blame - true if the "blame" link should be shown for blobs
#
# The format of a row is: mode [size] list link.  Where mode is the mode of
# the entry, list is the name of the entry (an href for blobs and trees),
# and link is the action links of the entry.
sub git_print_tree_entry {
	my ($t, $basedir, $hash_base, $have_blame) = @_;

	my %base_key = ();
	$base_key{'hash_base'} = $hash_base if defined $hash_base;

	# full path of the entry, used by every link below
	my $path = "$basedir$t->{'name'}";

	print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
	if (exists $t->{'size'}) {
		print "<td class=\"size\">$t->{'size'}</td>\n";
	}
	if ($t->{'type'} eq "blob") {
		print "<td class=\"list\">" .
			$cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
			                       file_name=>$path, %base_key),
			        -class => "list"}, esc_path($t->{'name'}));
		if (S_ISLNK(oct $t->{'mode'})) {
			my $link_target = git_get_link_target($t->{'hash'});
			# test for "non-empty", not for truth: a link pointing at a
			# file named "0" has a false, but valid, target
			if (defined $link_target && $link_target ne '') {
				my $norm_target = normalize_link_target($link_target, $basedir);
				if (defined $norm_target) {
					print " -> " .
					      $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
					                             file_name=>$norm_target),
					               -title => $norm_target}, esc_path($link_target));
				} else {
					# target cannot be resolved inside the tree: plain text
					print " -> " . esc_path($link_target);
				}
			}
		}
		print "</td>\n";
		print "<td class=\"link\">";
		print $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
		                             file_name=>$path, %base_key)},
		              "blob");
		if ($have_blame) {
			print " | " .
			      $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
			                             file_name=>$path, %base_key)},
			              "blame");
		}
		if (defined $hash_base) {
			print " | " .
			      $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
			                             hash=>$t->{'hash'}, file_name=>$path)},
			              "history");
		}
		print " | " .
			$cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
			                       file_name=>$path)},
			        "raw");
		print "</td>\n";

	} elsif ($t->{'type'} eq "tree") {
		print "<td class=\"list\">";
		print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
		                             file_name=>$path,
		                             %base_key)},
		              esc_path($t->{'name'}));
		print "</td>\n";
		print "<td class=\"link\">";
		print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
		                             file_name=>$path,
		                             %base_key)},
		              "tree");
		if (defined $hash_base) {
			print " | " .
			      $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
			                             file_name=>$path)},
			              "history");
		}
		print "</td>\n";
	} else {
		# unknown object: we can only present history for it
		# (this includes 'commit' object, i.e. submodule support)
		print "<td class=\"list\">" .
		      esc_path($t->{'name'}) .
		      "</td>\n";
		print "<td class=\"link\">";
		if (defined $hash_base) {
			print $cgi->a({-href => href(action=>"history",
			                             hash_base=>$hash_base,
			                             file_name=>$path)},
			              "history");
		}
		print "</td>\n";
	}
}
4677
4678 ## ......................................................................
4679 ## functions printing large fragments of HTML
4680
# Fill in pre-image filenames for a merge (combined) diff entry.
#
# $diff    - hashref of a parsed combined difftree line; 'nparents',
#            'status' and 'from_id' are read, 'from_file' is (re)created
# @parents - parent commit ids, in the same order as the per-parent arrays
#
# 'from_file' gets one slot per parent; a slot is filled, by looking the
# pre-image blob up in the matching parent, only when the file was renamed
# ('R') or copied ('C') with respect to that parent.  Returns $diff.
sub fill_from_file_info {
	my ($diff, @parents) = @_;

	my $from_file = $diff->{'from_file'} = [ ];
	# pre-extend the array so that it has a slot for every parent
	$from_file->[$diff->{'nparents'} - 1] = undef;

	foreach my $i (0 .. $diff->{'nparents'} - 1) {
		my $status = $diff->{'status'}[$i];
		next unless ($status eq 'R' || $status eq 'C');

		$from_file->[$i] =
			git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
	}

	return $diff;
}
4697
# Tell whether a parsed raw difftree line describes a file deletion,
# i.e. whether its post-image id ('to_id') is the all-zero object id.
sub is_deleted {
	my ($diffinfo) = @_;

	my $null_id = '0' x 40;
	return $diffinfo->{'to_id'} eq $null_id;
}
4704
# Does the patch correspond to the [previous] difftree raw line?
#
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
#
# True only when both are defined and name the same post-image file.
sub is_patch_split {
	my ($diffinfo, $patchinfo) = @_;

	my $both_known = (defined $diffinfo && defined $patchinfo);
	return $both_known
		&& ($diffinfo->{'to_file'} eq $patchinfo->{'to_file'});
}
4715
4716
# Print the list of files changed by a commit as an HTML table
# (class "diff_tree", or "combined diff_tree" when there are several parents).
#
# Parameters:
#   $difftree - array reference of difftree lines; each one is passed through
#               parsed_difftree_line()
#   $hash     - id of the commit being shown (base for post-image links)
#   @parents  - ids of its parents; the first one is the base for pre-image
#               links of ordinary (non-combined) diffs
#
# Every file gets one row with its name, a description of the change and the
# action links.  In the 'commitdiff' view (global $action) each row also links
# to the "patchN" anchor of the corresponding patch; N is counted here, so
# rows must be printed in the same order as the patches.
sub git_difftree_body {
	my ($difftree, $hash, @parents) = @_;
	my ($parent) = $parents[0];
	my $have_blame = gitweb_check_feature('blame');

	print "<div class=\"list_head\">\n";
	if ($#{$difftree} > 10) {
		print(($#{$difftree} + 1) . " files changed:\n");
	}
	print "</div>\n";

	print "<table class=\"" .
	      (@parents > 1 ? "combined " : "") .
	      "diff_tree\">\n";

	# header only for combined diff in 'commitdiff' view
	my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
	if ($has_header) {
		# table header
		print "<thead><tr>\n" .
		      "<th></th><th></th>\n"; # filename, patchN link
		foreach my $i (0 .. $#parents) {
			my $par = $parents[$i];
			print "<th>" .
			      $cgi->a({-href => href(action=>"commitdiff",
			                             hash=>$hash, hash_parent=>$par),
			               -title => 'commitdiff to parent number ' .
			                          ($i+1) . ': ' . substr($par,0,7)},
			              $i+1) .
			      "&nbsp;</th>\n";
		}
		print "</tr></thead>\n<tbody>\n";
	}

	my $alternate = 1;
	my $patchno = 0;

	# link to the next patch on the page; advances the patch counter
	my $next_patch_link = sub {
		$patchno++;
		return $cgi->a({-href => href(-anchor=>"patch$patchno")},
		               "patch");
	};

	foreach my $line (@{$difftree}) {
		my $diff = parsed_difftree_line($line);

		# rows alternate between the "dark" and "light" classes
		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		if (exists $diff->{'nparents'}) { # combined diff

			fill_from_file_info($diff, @parents)
				unless exists $diff->{'from_file'};

			if (!is_deleted($diff)) {
				# file exists in the result (child) commit
				print "<td>" .
				      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash),
				              -class => "list"}, esc_path($diff->{'to_file'})) .
				      "</td>\n";
			} else {
				print "<td>" .
				      esc_path($diff->{'to_file'}) .
				      "</td>\n";
			}

			if ($action eq 'commitdiff') {
				# link to patch
				print "<td class=\"link\">" .
				      $next_patch_link->() .
				      " | " .
				      "</td>\n";
			}

			# one cell per parent, linking to the pre-image or to the diff
			my $has_history = 0;
			my $not_deleted = 0;
			for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
				my $hash_parent = $parents[$i];
				my $from_hash = $diff->{'from_id'}[$i];
				my $from_path = $diff->{'from_file'}[$i];
				my $status = $diff->{'status'}[$i];

				$has_history ||= ($status ne 'A');
				$not_deleted ||= ($status ne 'D');

				if ($status eq 'A') {
					print "<td  class=\"link\" align=\"right\"> | </td>\n";
				} elsif ($status eq 'D') {
					print "<td class=\"link\">" .
					      $cgi->a({-href => href(action=>"blob",
					                             hash_base=>$hash,
					                             hash=>$from_hash,
					                             file_name=>$from_path)},
					              "blob" . ($i+1)) .
					      " | </td>\n";
				} else {
					if ($diff->{'to_id'} eq $from_hash) {
						print "<td class=\"link nochange\">";
					} else {
						print "<td class=\"link\">";
					}
					print $cgi->a({-href => href(action=>"blobdiff",
					                             hash=>$diff->{'to_id'},
					                             hash_parent=>$from_hash,
					                             hash_base=>$hash,
					                             hash_parent_base=>$hash_parent,
					                             file_name=>$diff->{'to_file'},
					                             file_parent=>$from_path)},
					              "diff" . ($i+1)) .
					      " | </td>\n";
				}
			}

			print "<td class=\"link\">";
			if ($not_deleted) {
				print $cgi->a({-href => href(action=>"blob",
				                             hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "blob");
				print " | " if ($has_history);
			}
			if ($has_history) {
				print $cgi->a({-href => href(action=>"history",
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "history");
			}
			print "</td>\n";

			print "</tr>\n";
			next; # instead of 'else' clause, to avoid extra indent
		}
		# else ordinary diff

		# mode '000000' means "no such side" (file created or deleted);
		# the mode variables of that side then stay undefined
		my ($to_mode_oct, $to_mode_str, $to_file_type);
		my ($from_mode_oct, $from_mode_str, $from_file_type);
		if ($diff->{'to_mode'} ne ('0' x 6)) {
			$to_mode_oct = oct $diff->{'to_mode'};
			if (S_ISREG($to_mode_oct)) { # only for regular file
				$to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
			}
			$to_file_type = file_type($diff->{'to_mode'});
		}
		if ($diff->{'from_mode'} ne ('0' x 6)) {
			$from_mode_oct = oct $diff->{'from_mode'};
			if (S_ISREG($from_mode_oct)) { # only for regular file
				$from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
			}
			$from_file_type = file_type($diff->{'from_mode'});
		}

		if ($diff->{'status'} eq "A") { # created
			my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
			$mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
			$mode_chng   .= "]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $next_patch_link->() .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			              "blob");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "D") { # deleted
			# the file exists only in the parent, so link relative to it
			my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'}),
			               -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $next_patch_link->() .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
			my $mode_chnge = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				$mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
				if ($from_file_type ne $to_file_type) {
					$mode_chnge .= " from $from_file_type to $to_file_type";
				}
				if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
					if ($from_mode_str && $to_mode_str) {
						$mode_chnge .= " mode: $from_mode_str->$to_mode_str";
					} elsif ($to_mode_str) {
						$mode_chnge .= " mode: $to_mode_str";
					}
				}
				$mode_chnge .= "]</span>\n";
			}
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chnge</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $next_patch_link->() .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only mode changed)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "diff") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			               "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
			my %status_name = ('R' => 'moved', 'C' => 'copied');
			my $nstatus = $status_name{$diff->{'status'}};
			my $mode_chng = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				# mode also for directories, so we cannot use $to_mode_str
				$mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
			}
			print "<td>" .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
			                             hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
			              -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
			      "<td><span class=\"file_status $nstatus\">[$nstatus from " .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
			                             hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
			              -class => "list"}, esc_path($diff->{'from_file'})) .
			      " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
			      "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $next_patch_link->() .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only pure rename or copy)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
				              "diff") .
				      " | ";
			}
			# The post-image lives in this commit: the new name need not
			# exist in the parent at all, so the base must be $hash (as in
			# the file name link in the first cell of this row).
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'to_file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'to_file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                            file_name=>$diff->{'to_file'})},
			              "history");
			print "</td>\n";

		} # we should not encounter Unmerged (U) or Unknown (X) status
		print "</tr>\n";
	}
	print "</tbody>" if $has_header;
	print "</table>\n";
}
5024
# Print a block of context lines followed by a block of removed/added lines,
# laid out side by side.
#
# $ctx, $rem, $add - array references with already formatted lines.
#
# Each block is a <div class="chunk_block KIND"> holding an "old" pane, a
# "new" pane, or both.  The context block is left out when there are no
# context lines; the second block is always printed and its KIND is "rem"
# (nothing added), "add" (nothing removed) or "chg" (both).
sub print_sidebyside_diff_lines {
	my ($ctx, $rem, $add) = @_;

	# one pane: the given lines wrapped in <div class="old|new">
	my $pane = sub {
		my ($side, $lines) = @_;
		return join('', '<div class="' . $side . '">', @$lines, '</div>');
	};
	# one block: the given panes wrapped in <div class="chunk_block KIND">
	my $block = sub {
		my ($kind, @panes) = @_;
		return join('', '<div class="chunk_block ' . $kind . '">', @panes, '</div>');
	};

	# print context block before add/rem block
	if (@$ctx) {
		print $block->('ctx', $pane->('old', $ctx), $pane->('new', $ctx));
	}

	if (!@$add) {
		# pure removal
		print $block->('rem', $pane->('old', $rem));
	} elsif (!@$rem) {
		# pure addition
		print $block->('add', $pane->('new', $add));
	} else {
		print $block->('chg', $pane->('old', $rem), $pane->('new', $add));
	}
}
5070
# Print context lines, then removed lines, then added lines, one after
# another (the inline, i.e. not side-by-side, layout).
#
# $ctx, $rem, $add - array references with already formatted lines.
sub print_inline_diff_lines {
	my ($ctx, $rem, $add) = @_;

	print map { @$_ } ($ctx, $rem, $add);
}
5077
# HTML-format one removed line and the added line that replaces it, marking
# the part that changed between them.
# Implementation is based on contrib/diff-highlight
#
# $rem, $add   - the raw removed and added diff lines
# $num_parents - number of leading +/- status characters to leave out of
#                the comparison (one for each parent)
#
# Returns the two formatted lines: the removed one first, then the added one.
sub format_rem_add_lines_pair {
	my ($rem, $add, $num_parents) = @_;

	# Tabs have to be expanded before the lines are split into characters;
	# otherwise the offsets computed below would be invalid.
	chomp($rem, $add);
	$rem = untabify($rem);
	$add = untabify($add);

	my @rem_chars = split(//, $rem);
	my @add_chars = split(//, $add);
	my $limit = (@rem_chars < @add_chars) ? scalar(@rem_chars) : scalar(@add_chars);

	# length of the common prefix, counted from the start of the line
	# but not comparing the leading +/- characters
	my $prefix_len = $num_parents;
	my $prefix_has_nonspace;
	while ($prefix_len < $limit
	       && $rem_chars[$prefix_len] eq $add_chars[$prefix_len]) {
		$prefix_has_nonspace = 1 if ($rem_chars[$prefix_len] !~ /\s/);
		$prefix_len++;
	}

	# length of the common suffix; it must not overlap the prefix
	my $suffix_len = 0;
	my $suffix_has_nonspace;
	while ($prefix_len + $suffix_len < $limit
	       && $rem_chars[-1 - $suffix_len] eq $add_chars[-1 - $suffix_len]) {
		$suffix_has_nonspace = 1 if ($rem_chars[-1 - $suffix_len] !~ /\s/);
		$suffix_len++;
	}

	# Only mark the difference when the lines share something other than
	# whitespace.  Marking completely different lines would make the output
	# unreadable, especially if the diff consists of multiple lines.
	my ($esc_rem, $esc_add);
	unless ($prefix_has_nonspace || $suffix_has_nonspace) {
		$esc_rem = esc_html($rem, -nbsp=>1);
		$esc_add = esc_html($add, -nbsp=>1);
	} else {
		$esc_rem = esc_html_hl_regions($rem, 'marked',
			[$prefix_len, @rem_chars - $suffix_len], -nbsp=>1);
		$esc_add = esc_html_hl_regions($add, 'marked',
			[$prefix_len, @add_chars - $suffix_len], -nbsp=>1);
	}

	return (format_diff_line(\$esc_rem, 'rem'),
	        format_diff_line(\$esc_add, 'add'));
}
5129
# HTML-format the context, removed and added lines of one block of changes.
# Returns three array references: (context, removed, added).
# Removed/added lines are formatted pairwise (with the changed part marked)
# when each removed line has exactly one corresponding added line.
sub format_ctx_rem_add_lines {
	my ($ctx, $rem, $add, $num_parents) = @_;
	my $is_combined = ($num_parents > 1);

	# Pairwise highlighting needs as many added lines as removed ones.
	my $can_highlight = (@$add > 0 && @$add == @$rem) ? 1 : 0;

	# In a combined diff, highlight only if every pair is a change
	# between the same versions, e.g.
	#
	#    - a
	#   -  b
	#    + c
	#   +  d
	#
	# Otherwise the highlighting would be confusing.
	if ($can_highlight && $is_combined) {
		foreach my $i (0 .. $#$add) {
			my $marks_rem = substr($rem->[$i], 0, $num_parents);
			my $marks_add = substr($add->[$i], 0, $num_parents);

			# the prefixes match if '-' lines up with '+'
			$marks_rem =~ tr/-/+/;

			if ($marks_rem ne $marks_add) {
				$can_highlight = 0;
				last;
			}
		}
	}

	my (@new_rem, @new_add);
	if ($can_highlight) {
		foreach my $i (0 .. $#$add) {
			my ($line_rem, $line_add) = format_rem_add_lines_pair(
				$rem->[$i], $add->[$i], $num_parents);
			push @new_rem, $line_rem;
			push @new_add, $line_add;
		}
	} else {
		@new_rem = map { format_diff_line($_, 'rem') } @$rem;
		@new_add = map { format_diff_line($_, 'add') } @$add;
	}

	my @new_ctx = map { format_diff_line($_, 'ctx') } @$ctx;

	return (\@new_ctx, \@new_rem, \@new_add);
}
5181
# Format the accumulated context, removed and added lines and print them
# in the requested diff style.  Side-by-side output is used only for
# non-combined diffs; the 'inline' style is the default and also the
# fallback for unknown styles.
sub print_diff_lines {
	my ($ctx, $rem, $add, $diff_style, $num_parents) = @_;
	my $is_combined = $num_parents > 1;

	my ($html_ctx, $html_rem, $html_add) =
		format_ctx_rem_add_lines($ctx, $rem, $add, $num_parents);

	my $printer = ($diff_style eq 'sidebyside' && !$is_combined)
		? \&print_sidebyside_diff_lines
		: \&print_inline_diff_lines;

	$printer->($html_ctx, $html_rem, $html_add);
}
5197
# Print one diff chunk.  @chunk is a list of [ $class, $line ] pairs.
# Chunk headers are printed immediately; context, removed and added lines
# are collected and handed to print_diff_lines() one block at a time.
sub print_diff_chunk {
	my ($diff_style, $num_parents, $from, $to, @chunk) = @_;

	return unless @chunk;

	my (@ctx, @rem, @add);
	my %bucket_for = (ctx => \@ctx, rem => \@rem, add => \@add);

	# The class of the previous line.
	my $prev_class = '';

	# An incomplete last line might be among removed or added lines,
	# or both, or among context lines: it takes the class of the line
	# that precedes it.
	foreach my $idx (1 .. $#chunk) {
		$chunk[$idx][0] = $chunk[$idx - 1][0]
			if ($chunk[$idx][0] eq 'incomplete');
	}

	# guardian: an empty entry that forces the final flush
	push @chunk, ["", ""];

	foreach my $entry (@chunk) {
		my ($class, $line) = @$entry;

		# chunk headers are printed right away
		if ($class && $class eq 'chunk_header') {
			print format_diff_line($line, $class, $from, $to);
			next;
		}

		# Flush the accumulator at the end of the chunk, when a context
		# line follows some add/rem lines, or when both add and rem
		# lines are pending and a new block starts (otherwise add/rem
		# lines could be reordered).
		my $flush = (!$class || ((@rem || @add) && $class eq 'ctx') ||
		             (@rem && @add && $class ne $prev_class));
		if ($flush) {
			print_diff_lines(\@ctx, \@rem, \@add,
			                 $diff_style, $num_parents);
			@ctx = @rem = @add = ();
		}

		# the guardian has no line: nothing left to accumulate
		last unless $line;

		# file the line under its class (rem, add or ctx)
		push @{ $bucket_for{$class} }, $line
			if exists $bucket_for{$class};

		$prev_class = $class;
	}
}
5255
# Read patch output ("diff --git", "diff --cc" or "diff --combined" patches)
# from $fd and print it as HTML: a <div class="patchset"> holding one
# <div class="patch"> per patch.
#
# Parameters:
#   $fd           - filehandle the patch text is read from, line by line
#   $diff_style   - passed through to print_diff_chunk()
#   $difftree     - reference to an array of raw difftree lines; each one
#                   is run through parsed_difftree_line()
#   $hash         - accepted for the callers' sake, not used in this sub
#   @hash_parents - parents; more than one means a combined diff
#
# Output is truncated gracefully when $fd ends in the middle of a patch
# header.
sub git_patchset_body {
	my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;

	my $is_combined = (@hash_parents > 1);
	my $patch_idx = 0;
	my $patch_number = 0;
	my $patch_line;
	my $diffinfo;
	my $to_name;
	my (%from, %to);
	my @chunk; # for side-by-side diff

	print "<div class=\"patchset\">\n";

	# skip to first patch
	while ($patch_line = <$fd>) {
		chomp $patch_line;

		last if ($patch_line =~ m/^diff /);
	}

 PATCH:
	while ($patch_line) {

		# parse "git diff" header line
		if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
			# $1 is from_name, which we do not use
			$to_name = unquote($2);
			$to_name =~ s!^b/!!;
		} elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
			# $1 is 'cc' or 'combined', which we do not use
			$to_name = unquote($2);
		} else {
			$to_name = undef;
		}

		# check if current patch belong to current raw line
		# and parse raw git-diff line if needed
		if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
			# this is continuation of a split patch
			print "<div class=\"patch cont\">\n";
		} else {
			# advance raw git-diff output if needed
			$patch_idx++ if defined $diffinfo;

			# read and prepare patch information
			$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

			# compact combined diff output can have some patches skipped
			# find which patch (using pathname of result) we are at now;
			if ($is_combined) {
				while ($to_name ne $diffinfo->{'to_file'}) {
					print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
					      format_diff_cc_simplified($diffinfo, @hash_parents) .
					      "</div>\n";  # class="patch"

					$patch_idx++;
					$patch_number++;

					last if $patch_idx > $#$difftree;
					$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
				}
			}

			# modifies %from, %to hashes
			parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

			# this is first patch for raw difftree line with $patch_idx index
			# we index @$difftree array from 0, but number patches from 1
			print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
		}

		# git diff header
		#assert($patch_line =~ m/^diff /) if DEBUG;
		#assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
		$patch_number++;
		# print "git diff" header
		print format_git_diff_header_line($patch_line, $diffinfo,
		                                  \%from, \%to);

		# print extended diff header
		print "<div class=\"diff extended_header\">\n";
	EXTENDED_HEADER:
		while ($patch_line = <$fd>) {
			chomp $patch_line;

			last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

			print format_extended_diff_header_line($patch_line, $diffinfo,
			                                       \%from, \%to);
		}
		print "</div>\n"; # class="diff extended_header"

		# from-file/to-file diff header
		if (! $patch_line) {
			# 'last' skips the continue block, so close the patch here
			print "</div>\n"; # class="patch"
			last PATCH;
		}
		next PATCH if ($patch_line =~ m/^diff /);
		#assert($patch_line =~ m/^---/) if DEBUG;

		my $last_patch_line = $patch_line;
		$patch_line = <$fd>;
		if (!defined $patch_line) {
			# Input ended right after the "--- " line: there is no
			# "+++" line to chomp or format, so end the patch the
			# same way as for input ending in the extended header.
			print "</div>\n"; # class="patch"
			last PATCH;
		}
		chomp $patch_line;
		#assert($patch_line =~ m/^\+\+\+/) if DEBUG;

		print format_diff_from_to_header($last_patch_line, $patch_line,
		                                 $diffinfo, \%from, \%to,
		                                 @hash_parents);

		# the patch itself
	LINE:
		while ($patch_line = <$fd>) {
			chomp $patch_line;

			next PATCH if ($patch_line =~ m/^diff /);

			my $class = diff_line_class($patch_line, \%from, \%to);

			# a new chunk header ends the chunk collected so far
			if ($class eq 'chunk_header') {
				print_diff_chunk($diff_style, scalar @hash_parents, \%from, \%to, @chunk);
				@chunk = ();
			}

			push @chunk, [ $class, $patch_line ];
		}

	} continue {
		# runs on 'next PATCH' and at the normal end of an iteration:
		# flush the last chunk of the patch and close its <div>
		if (@chunk) {
			print_diff_chunk($diff_style, scalar @hash_parents, \%from, \%to, @chunk);
			@chunk = ();
		}
		print "</div>\n"; # class="patch"
	}

	# for compact combined (--cc) format, with chunk and patch simplification
	# the patchset might be empty, but there might be unprocessed raw lines
	for (++$patch_idx if $patch_number > 0;
	     $patch_idx < @$difftree;
	     ++$patch_idx) {
		# read and prepare patch information
		$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

		# generate anchor for "patch" links in difftree / whatchanged part
		print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
		      format_diff_cc_simplified($diffinfo, @hash_parents) .
		      "</div>\n";  # class="patch"

		$patch_number++;
	}

	if ($patch_number == 0) {
		if (@hash_parents > 1) {
			print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
		} else {
			print "<div class=\"diff nodifferences\">No differences found</div>\n";
		}
	}

	print "</div>\n"; # class="patchset"
}
5418
5419 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5420
# Print the project search form: a text field for the search text, a
# checkbox selecting regular expression search, a submit button and a
# link that lists all projects.  When $project_filter is set, the titles
# mention it and it is carried along in a hidden 'pf' field.
sub git_project_search_form {
	my ($searchtext, $search_use_regexp) = @_;

	my $limit = $project_filter ? " in '$project_filter/'" : '';

	my $form = "<div class=\"projsearch\">\n";
	$form .= $cgi->startform(-method => 'get', -action => $my_uri);
	$form .= $cgi->hidden(-name => 'a', -value => 'project_list') . "\n";
	if (defined $project_filter) {
		$form .= $cgi->hidden(-name => 'pf', -value => $project_filter) . "\n";
	}
	$form .= $cgi->textfield(-name => 's', -value => $searchtext,
	                         -title => "Search project by name and description$limit",
	                         -size => 60) . "\n";
	$form .= "<span title=\"Extended regular expression\">" .
	         $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
	                        -checked => $search_use_regexp) .
	         "</span>\n";
	$form .= $cgi->submit(-name => 'btnS', -value => 'Search');
	$form .= $cgi->end_form() . "\n";
	$form .= $cgi->a({-href => href(project => undef, searchtext => undef,
	                                project_filter => $project_filter)},
	                 esc_html("List all projects$limit")) . "<br />\n";
	$form .= "</div>\n";

	print $form;
}
5448
# Tell whether the entry %$project_info still needs filling for @keys:
# returns 1 if at least one of the keys is not present in the hash
# (a key whose value is undef counts as present), and nothing otherwise.
sub project_info_needs_filling {
	my ($project_info, @keys) = @_;

	# same as: List::MoreUtils::any { !exists $project_info->{$_} } @keys
	my @missing = grep { !exists $project_info->{$_} } @keys;
	return 1 if @missing;

	return;
}
5462
# Fill in project list info (age, description, owner, ctags, category)
# for each project in the list and return the list of filled projects.
# With extra arguments only the named fields are filled.
#
# Invalid projects are left out of the returned list if and only if
# 'age' or 'age_string' is to be filled: those are the only fields that
# unconditionally run a git command which requires the repository, and
# therefore the only ones that always notice an invalid repository.
#
# USAGE:
# * fill_project_list_info(\@project_list, 'descr_long', 'ctags')
#   ensures that 'descr_long' and 'ctags' fields are filled
# * @project_list = fill_project_list_info(\@project_list)
#   ensures that all fields are filled (and invalid projects removed)
#
# NOTE: modifies the entries of $projlist, but does not remove any
# entry from $projlist itself
sub fill_project_list_info {
	my ($projlist, @wanted_keys) = @_;

	# Without @wanted_keys every field passes the selection; otherwise
	# only the requested ones do.
	my %is_wanted = map { $_ => 1 } @wanted_keys;
	my $select = @wanted_keys
		? sub { return grep { $is_wanted{$_} } @_; }
		: sub { return @_; };

	my $show_ctags = gitweb_check_feature('ctags');
	my @filled;

 PROJECT:
	foreach my $pr (@$projlist) {
		# true if any of the given fields is wanted and still missing
		my $needs = sub {
			return project_info_needs_filling($pr, $select->(@_));
		};

		if ($needs->('age', 'age_string')) {
			my @activity = git_get_last_activity($pr->{'path'});
			# no activity info: skip this project altogether
			next PROJECT unless @activity;
			($pr->{'age'}, $pr->{'age_string'}) = @activity;
		}

		if ($needs->('descr', 'descr_long')) {
			my $descr = to_utf8(
				git_get_project_description($pr->{'path'}) || "");
			$pr->{'descr_long'} = $descr;
			$pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
		}

		if ($needs->('owner')) {
			$pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
		}

		if ($show_ctags && $needs->('ctags')) {
			$pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
		}

		if ($projects_list_group_categories && $needs->('category')) {
			my $cat = git_get_project_category($pr->{'path'}) ||
			          $project_list_default_category;
			$pr->{'category'} = to_utf8($cat);
		}

		push @filled, $pr;
	}

	return @filled;
}
5523
# Return the projects from @$projlist sorted according to $order, which
# is one of 'project', 'descr', 'owner' or 'age'.  For any other (or an
# undefined) $order the list is returned in its original order.
#
# Projects that lack the sort field are compared as '' (string orders)
# or 0 (numeric order).  That is the value Perl would use for undef
# anyway, but spelling it out avoids "uninitialized value" warnings, e.g.
# when sorting by a field that was never filled in.
sub sort_projects_list {
	my ($projlist, $order) = @_;

	my %order_info = (
		project => { key => 'path', type => 'str' },
		descr => { key => 'descr_long', type => 'str' },
		owner => { key => 'owner', type => 'str' },
		age => { key => 'age', type => 'num' }
	);
	my $oi = defined $order ? $order_info{$order} : undef;
	return @$projlist unless defined $oi;

	my $key = $oi->{'key'};
	my @projects;
	if ($oi->{'type'} eq 'str') {
		@projects = sort {
			(defined $a->{$key} ? $a->{$key} : '') cmp
			(defined $b->{$key} ? $b->{$key} : '')
		} @$projlist;
	} else {
		@projects = sort {
			(defined $a->{$key} ? $a->{$key} : 0) <=>
			(defined $b->{$key} ? $b->{$key} : 0)
		} @$projlist;
	}

	return @projects;
}
5544
# Group the projects at indices $from..$to of @$projlist by category.
# Returns a hash (in list context) or a hash reference (in scalar context)
# that maps each category to the list of projects belonging to it.
# $from defaults to 0; $to defaults to, and is capped at, the last index.
sub build_projlist_by_category {
	my ($projlist, $from, $to) = @_;

	my $last_idx = $#$projlist;
	$from = 0 unless defined $from;
	$to = $last_idx if (!defined $to || $last_idx < $to);

	my %categories;
	foreach my $idx ($from .. $to) {
		my $pr = $projlist->[$idx];
		push @{ $categories{ $pr->{'category'} } }, $pr;
	}

	return wantarray ? %categories : \%categories;
}
5561
# Print a 'sort by' <th> element as produced by format_sort_th(); takes
# the same arguments ($name, $order and an optional $header).
sub print_sort_th {
	my @th_args = @_;

	return print format_sort_th(@th_args);
}
5567
# Return a 'sort by' <th> element for the column $name.  The header text
# is $header, or $name with its first letter capitalized.  Unless the list
# is already ordered by $name ($order eq $name), the header is a link that
# replays the current request with order set to $name.
sub format_sort_th {
	my ($name, $order, $header) = @_;
	$header ||= ucfirst($name);

	# already sorted by this column: plain header, no link
	return "<th>$header</th>\n" if ($order eq $name);

	my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
	                         -class => "header"}, $header);
	return "<th>" . $sort_link . "</th>\n";
}
5584
# Print one table row for each project at indices $from..$to of @$projlist
# ($from defaults to 0; $to defaults to, and is capped at, the last index).
# A row holds an optional forks cell (when $check_forks is true), the
# project name, its description, the owner and age columns (unless
# omitted by configuration) and a cell with action links.
sub git_project_list_rows {
	my ($projlist, $from, $to, $check_forks) = @_;

	$from = 0 unless defined $from;
	$to = $#$projlist if (!defined $to || $#$projlist < $to);

	my $row_no = 0;
	foreach my $i ($from .. $to) {
		my $pr = $projlist->[$i];

		# rows alternate between 'dark' and 'light', starting with 'dark'
		my $row_class = ($row_no++ % 2) ? 'light' : 'dark';
		print "<tr class=\"$row_class\">\n";

		if ($check_forks) {
			print "<td>";
			if ($pr->{'forks'}) {
				my $nforks = scalar @{$pr->{'forks'}};
				# link to the forks only if there are any
				print(($nforks > 0)
					? $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks"),
					           -title => "$nforks forks"}, "+")
					: $cgi->span({-title => "$nforks forks"}, "+"));
			}
			print "</td>\n";
		}

		my $name_link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
		                         -class => "list"},
		                        esc_html_match_hl($pr->{'path'}, $search_regexp));
		my $descr_link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
		                          -class => "list",
		                          -title => $pr->{'descr_long'}},
		                         $search_regexp
		                         ? esc_html_match_hl_chopped($pr->{'descr_long'},
		                                                     $pr->{'descr'}, $search_regexp)
		                         : esc_html($pr->{'descr'}));
		print "<td>" . $name_link . "</td>\n" .
		      "<td>" . $descr_link . "</td>\n";

		if (!$omit_owner) {
			print "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
		}
		if (!$omit_age_column) {
			my $age_text = defined $pr->{'age_string'}
				? $pr->{'age_string'} : "No commits";
			print "<td class=\"". age_class($pr->{'age'}) . "\">" .
			      $age_text . "</td>\n";
		}

		# action links; 'forks' is offered only for projects with forks
		my @actions = qw(summary shortlog log tree);
		push @actions, 'forks' if $pr->{'forks'};
		my @links;
		foreach my $action (@actions) {
			push @links, scalar $cgi->a(
				{-href => href(project=>$pr->{'path'}, action=>$action)}, $action);
		}
		print "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
}
5644
# Print the list of projects as an HTML table, preceded by the tag cloud
# when the 'ctags' feature is enabled.
#
# Parameters:
#   $projlist  - reference to an array of project info hashes
#   $order     - sort order; defaults to $default_projects_order
#   $from, $to - window of project indices to show (default: all)
#   $extra     - optional content for an extra row at the end of the table;
#                it is printed as is, not escaped
#   $no_header - if true, the row with column headers is not printed
#
# Projects are filtered (forks, tag filter, search), filled with the
# missing info and sorted before the window is applied.
sub git_project_list_body {
	# actually uses global variable $project
	my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
	my @projects = @$projlist;

	my $check_forks = gitweb_check_feature('forks');
	my $show_ctags  = gitweb_check_feature('ctags');
	my $tagfilter = $show_ctags ? $input_params{'ctag'} : undef;
	# forks are not checked when the list is being filtered
	$check_forks = undef
		if ($tagfilter || $search_regexp);

	# filtering out forks before filling info allows to do less work
	@projects = filter_forks_from_projects_list(\@projects)
		if ($check_forks);
	# search_projects_list pre-fills required info
	@projects = search_projects_list(\@projects,
	                                 'search_regexp' => $search_regexp,
	                                 'tagfilter'  => $tagfilter)
		if ($tagfilter || $search_regexp);
	# fill the rest
	my @all_fields = ('descr', 'descr_long', 'ctags', 'category');
	push @all_fields, ('age', 'age_string') unless($omit_age_column);
	push @all_fields, 'owner' unless($omit_owner);
	@projects = fill_project_list_info(\@projects, @all_fields);

	$order ||= $default_projects_order;
	$from = 0 unless defined $from;
	$to = $#projects if (!defined $to || $#projects < $to);

	# short circuit
	if ($from > $to) {
		print "<center>\n".
		      "<b>No such projects found</b><br />\n".
		      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
		      "</center>\n<br />\n";
		return;
	}

	@projects = sort_projects_list(\@projects, $order);

	if ($show_ctags) {
		my $ctags = git_gather_all_ctags(\@projects);
		my $cloud = git_populate_project_tagcloud($ctags);
		print git_show_project_tagcloud($cloud, 64);
	}

	print "<table class=\"project_list\">\n";
	unless ($no_header) {
		print "<tr>\n";
		if ($check_forks) {
			print "<th></th>\n";
		}
		print_sort_th('project', $order, 'Project');
		print_sort_th('descr', $order, 'Description');
		print_sort_th('owner', $order, 'Owner') unless $omit_owner;
		print_sort_th('age', $order, 'Last Change') unless $omit_age_column;
		print "<th></th>\n" . # for links
		      "</tr>\n";
	}

	if ($projects_list_group_categories) {
		# only display categories with projects in the $from-$to window
		@projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
		# @projects now holds just the window, re-indexed from 0, so all
		# of it has to be grouped; applying $from/$to a second time would
		# drop the first $from projects of the window
		my %categories = build_projlist_by_category(\@projects);
		foreach my $cat (sort keys %categories) {
			unless ($cat eq "") {
				print "<tr>\n";
				if ($check_forks) {
					print "<td></td>\n";
				}
				print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
				print "</tr>\n";
			}

			git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
		}
	} else {
		git_project_list_rows(\@projects, $from, $to, $check_forks);
	}

	if (defined $extra) {
		print "<tr>\n";
		if ($check_forks) {
			print "<td></td>\n";
		}
		print "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5735
# Print the 'log' view body: for each commit at indices $from..$to of
# @$commitlist a header with age, title and ref markers, links to the
# commit, commitdiff and tree views, the authorship and the commit message.
#
# Parameters:
#   $commitlist - reference to an array of commit info hashes
#   $from, $to  - window of commit indices to show ($from defaults to 0;
#                 $to defaults to, and is capped at, the last index)
#   $refs       - passed to format_ref_marker() together with the commit id
#   $extra      - optional content printed after the commits in a
#                 <div class="page_nav">; it is printed as is
sub git_log_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	# start at $from, like git_shortlog_body() and git_history_body() do
	for (my $i = $from; $i <= $to; $i++) {
		my %co = %{$commitlist->[$i]};
		# skip entries without any commit info
		next if !%co;
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);
		git_print_header_div('commit',
		               "<span class=\"age\">$co{'age_string'}</span>" .
		               esc_html($co{'title'}) . $ref,
		               $commit);
		print "<div class=\"title_text\">\n" .
		      "<div class=\"log_link\">\n" .
		      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
		      "<br/>\n" .
		      "</div>\n";
		git_print_authorship(\%co, -tag => 'span');
		print "<br/>\n</div>\n";

		print "<div class=\"log_body\">\n";
		git_print_log($co{'comment'}, -final_empty_line=> 1);
		print "</div>\n";
	}
	if ($extra) {
		print "<div class=\"page_nav\">\n";
		print "$extra\n";
		print "</div>\n";
	}
}
5774
# Print the 'shortlog' table: one row for each commit at indices
# $from..$to of @$commitlist ($from defaults to 0; $to defaults to, and is
# capped at, the last index).  A row shows the date, the author, the
# subject and links to the commit, commitdiff and tree views, followed by
# snapshot links when format_snapshot_links() provides them.
# A defined $extra is printed as is in an additional row at the end.
sub git_shortlog_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	print "<table class=\"shortlog\">\n";
	my $row_no = 0;
	foreach my $i ($from .. $to) {
		my %co = %{$commitlist->[$i]};
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		# rows alternate between 'dark' and 'light', starting with 'dark'
		my $row_class = ($row_no++ % 2) ? 'light' : 'dark';
		print "<tr class=\"$row_class\">\n";

		# git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 10) . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my @links = (
			scalar $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit"),
			scalar $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
			scalar $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree"),
		);
		print "</td>\n" .
		      "<td class=\"link\">" .
		      join(" | ", @links);

		my $snapshot_links = format_snapshot_links($commit);
		print " | " . $snapshot_links
			if (defined $snapshot_links);

		print "</td>\n" .
		      "</tr>\n";
	}

	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5818
# Print the "history" table for one path: a row for each non-empty entry
# of $commitlist between indexes $from and $to.
#   $from, $to - index range; $from defaults to 0, $to is clamped to the
#                last index of $commitlist
#   $refs      - handed to format_ref_marker()
#   $extra     - if defined, HTML printed in a trailing full-width row
#   $file_name - path whose history is shown
#   $file_hash - hash compared against each commit's version of the path
#   $ftype     - used both as the action and as the label of the first link;
#                'blob' additionally enables the "diff to current" link
# Uses the global $hash_base when building the blobdiff link.
sub git_history_body {
	# Warning: assumes constant type (blob or tree) during history
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;

	my $last_idx = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last_idx if (!defined $to || $to > $last_idx);

	print "<table class=\"history\">\n";
	my $dark_row = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		# empty entries produce no row and do not affect row colouring
		next unless %co;

		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		my $row_class = $dark_row ? "dark" : "light";
		$dark_row = !$dark_row;
		print "<tr class=\"$row_class\">\n";

		# shortlog:   format_author_html('td', \%co, 10)
		my $author_cell = format_author_html('td', \%co, 15, 3);
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      $author_cell . "<td>";
		# originally git_history used chop_str($co{'title'}, 50)
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $path_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
		my $commitdiff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $path_link . " | " . $commitdiff_link;

		if ($ftype eq 'blob') {
			# offer a diff only when the blob at this commit differs
			# from the current one
			my $blob_parent = git_get_hash_by_path($commit, $file_name);
			my $differs = defined $file_hash && defined $blob_parent &&
			              $file_hash ne $blob_parent;
			if ($differs) {
				my $diff_href = href(action=>"blobdiff",
				                     hash=>$file_hash, hash_parent=>$blob_parent,
				                     hash_base=>$hash_base, hash_parent_base=>$commit,
				                     file_name=>$file_name);
				print " | " . $cgi->a({-href => $diff_href}, "diff to current");
			}
		}
		print "</td>\n" .
		      "</tr>\n";
	}

	print "<tr>\n" .
	      "<td colspan=\"4\">$extra</td>\n" .
	      "</tr>\n"
		if defined $extra;
	print "</table>\n";
}
5878
# Print the "tags" table: one row for each entry of $taglist from index
# $from through index $to, with age, name, subject, a "tag" self-link
# (tag objects only) and links that depend on the referenced object type.
#   $from  - first index to show; defaults to 0
#   $to    - last index to show; defaults (and is clamped) to the last index
#   $extra - if defined, HTML printed in a trailing row spanning 5 columns
sub git_tags_body {
	# uses global variable $project
	my ($taglist, $from, $to, $extra) = @_;

	my $last_idx = $#{$taglist};
	$from = 0 unless defined $from;
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"tags\">\n";
	my $dark_row = 1;
	foreach my $idx ($from .. $to) {
		my %tag = %{$taglist->[$idx]};

		# shortened subject, only when the tag has a subject at all
		my $comment = $tag{'subject'};
		my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

		my $row_class = $dark_row ? "dark" : "light";
		$dark_row = !$dark_row;
		print "<tr class=\"$row_class\">\n";

		# age column stays empty when no age is recorded
		print defined $tag{'age'}
			? "<td><i>$tag{'age'}</i></td>\n"
			: "<td></td>\n";

		my $name_link = $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
		                         -class => "list name"}, esc_html($tag{'name'}));
		print "<td>" .
		      $name_link .
		      "</td>\n" .
		      "<td>";
		print format_subject_html($comment, $comment_short,
		                          href(action=>"tag", hash=>$tag{'id'}))
			if defined $comment;

		# only tag objects get a link to their own "tag" view
		my $selflink = $tag{'type'} eq "tag"
			? $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag")
			: "&nbsp;";
		print "</td>\n" .
		      "<td class=\"selflink\">" .
		      $selflink;

		my $target_link = $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
		print "</td>\n" .
		      "<td class=\"link\">" . " | " .
		      $target_link;

		# extra links depend on what the tag points at
		if ($tag{'reftype'} eq "commit") {
			my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
			my $log_link = $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
			print " | " . $shortlog_link .
			      " | " . $log_link;
		} elsif ($tag{'reftype'} eq "blob") {
			print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}
		print "</td>\n" .
		      "</tr>";
	}

	print "<tr>\n" .
	      "<td colspan=\"5\">$extra</td>\n" .
	      "</tr>\n"
		if defined $extra;
	print "</table>\n";
}
5941
# Print the "heads" table: one row for each entry of $headlist from index
# $from through index $to, with age, name and shortlog/log/tree links.
#   $head_at - if defined, the row whose 'id' equals it gets the
#              "current_head" CSS class on its name cell
#   $from    - first index to show; defaults to 0
#   $to      - last index to show; defaults (and is clamped) to the last index
#   $extra   - if defined, HTML printed in a trailing row spanning 3 columns
sub git_heads_body {
	# uses global variable $project
	my ($headlist, $head_at, $from, $to, $extra) = @_;

	my $last_idx = $#{$headlist};
	$from = 0 unless defined $from;
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"heads\">\n";
	my $dark_row = 1;
	foreach my $idx ($from .. $to) {
		my %ref = %{$headlist->[$idx]};
		my $is_current = defined $head_at && $ref{'id'} eq $head_at;

		my $row_class = $dark_row ? "dark" : "light";
		$dark_row = !$dark_row;
		print "<tr class=\"$row_class\">\n";

		my $name_cell_open = $is_current ? "<td class=\"current_head\">" : "<td>";
		my $name_link = $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
		                         -class => "list name"},esc_html($ref{'name'}));
		my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog");
		my $log_link = $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log");
		my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree");

		print "<td><i>$ref{'age'}</i></td>\n" .
		      $name_cell_open .
		      $name_link .
		      "</td>\n" .
		      "<td class=\"link\">" .
		      $shortlog_link . " | " .
		      $log_link . " | " .
		      $tree_link .
		      "</td>\n" .
		      "</tr>";
	}

	print "<tr>\n" .
	      "<td colspan=\"3\">$extra</td>\n" .
	      "</tr>\n"
		if defined $extra;
	print "</table>\n";
}
5979
# Display a single remote block
#
# Prints a table with the remote's URL(s), followed by the table of its
# heads as rendered by git_heads_body().
#   $remote - remote name, used for the "..." link to the remotes view
#   $rdata  - hash ref with 'heads', 'fetch' and 'push' entries
#   $limit  - if defined, maximum index passed on to git_heads_body(); a
#             "..." link is added when there are more heads than $limit
#   $head   - passed to git_heads_body() to mark the current head
sub git_remote_block {
	my ($remote, $rdata, $limit, $head) = @_;

	my $heads = $rdata->{'heads'};
	my $fetch = $rdata->{'fetch'};
	my $push = $rdata->{'push'};

	my $urls_table = "<table class=\"projects_list\">\n" ;

	if (defined $fetch) {
		# $push may be undefined here (see the guard in the else branch),
		# so check it before comparing to avoid an "uninitialized value"
		# warning and a bogus match against an empty fetch URL
		if (defined $push && $fetch eq $push) {
			$urls_table .= format_repo_url("URL", $fetch);
		} else {
			$urls_table .= format_repo_url("Fetch URL", $fetch);
			$urls_table .= format_repo_url("Push URL", $push) if defined $push;
		}
	} elsif (defined $push) {
		$urls_table .= format_repo_url("Push URL", $push);
	} else {
		$urls_table .= format_repo_url("", "No remote URL");
	}

	$urls_table .= "</table>\n";

	# link to the full list when the heads are going to be truncated
	my $dots;
	if (defined $limit && $limit < @$heads) {
		$dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
	}

	print $urls_table;
	git_heads_body($heads, $head, 0, $limit, $dots);
}
6013
# Display a list of remote names with the respective fetch and push URLs
#
#   $remotedata - hash ref: remote name => hash ref with optional 'fetch'
#                 and 'push' URLs
#   $limit      - if true and smaller than the number of remotes, only the
#                 first $limit names (in sorted order) are shown, followed
#                 by a "..." link to the full remotes view
sub git_remotes_list {
	my ($remotedata, $limit) = @_;
	print "<table class=\"heads\">\n";
	my $alternate = 1;
	my @remotes = sort keys %$remotedata;

	my $limited = $limit && $limit < @remotes;

	$#remotes = $limit - 1 if $limited;

	# Iterate with foreach rather than "while (... = shift ...)": the latter
	# stops at the first name that is false in boolean context (e.g. "0").
	foreach my $remote (@remotes) {
		my $rdata = $remotedata->{$remote};
		my $fetch = $rdata->{'fetch'};
		my $push = $rdata->{'push'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td>" .
		      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
		               -class=> "list name"},esc_html($remote)) .
		      "</td>";
		# a URL that is not configured is shown as plain text, not a link
		print "<td class=\"link\">" .
		      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
		      " | " .
		      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
		      "</td>";

		print "</tr>\n";
	}

	if ($limited) {
		print "<tr>\n" .
		      "<td colspan=\"3\">" .
		      $cgi->a({-href => href(action=>"remotes")}, "...") .
		      "</td>\n" . "</tr>\n";
	}

	print "</table>";
}
6057
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#
#   $remotedata - hash ref: remote name => per-remote data
#   $limit      - if true and smaller than the number of remotes, only the
#                 names are listed (via git_remotes_list()); it is also
#                 passed on as the per-remote limit
#   $head       - passed to git_remote_block()
sub git_remotes_body {
	my ($remotedata, $limit, $head) = @_;
	if ($limit and $limit < keys %$remotedata) {
		git_remotes_list($remotedata, $limit);
	} else {
		fill_remote_heads($remotedata);
		# Walk the remotes in sorted order, as git_remotes_list() does,
		# so that the sections come out in a stable order instead of in
		# the unspecified order hash iteration would give.
		foreach my $remote (sort keys %$remotedata) {
			my $rdata = $remotedata->{$remote};
			git_print_section({-class=>"remote", -id=>$remote},
				["remotes", $remote, $remote], sub {
					git_remote_block($remote, $rdata, $limit, $head);
				});
		}
	}
}
6074
# Render the result page of a commit / author / committer search.
#
# Takes the commit the search starts from as a flattened hash (%co).
# Uses the globals $searchtype, $searchtext, $search_use_regexp, $hash
# and $page.  Up to 101 commits are requested per page so that the
# presence of entry number 100 tells whether a "next" page exists.
sub git_search_message {
	my %co = @_;

	# option prefix matching the kind of search
	my %option_for = (
		'commit'    => "--grep=",
		'author'    => "--author=",
		'committer' => "--committer=",
	);
	my $greptype = $option_for{$searchtype};
	$greptype .= $searchtext;

	my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
	my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
	                               $greptype, '--regexp-ignore-case',
	                               $match_mode);

	# "first" and "prev" are links only when we are past the first page
	my $first_prev;
	if ($page > 0) {
		my $first_link = $cgi->a({-href => href(-replay=>1, page=>undef)},
		                         "first");
		my $prev_link = $cgi->a({-href => href(-replay=>1, page=>$page-1),
		                         -accesskey => "p", -title => "Alt-p"}, "prev");
		$first_prev = $first_link . " &sdot; " . $prev_link;
	} else {
		$first_prev = "first &sdot; prev";
	}

	# "next" is a link only when more results exist than fit on this page
	my $has_more = $#commitlist >= 100;
	my $next_link = '';
	if ($has_more) {
		$next_link = $cgi->a({-href => href(-replay=>1, page=>$page+1),
		                      -accesskey => "n", -title => "Alt-n"}, "next");
	}
	my $paging_nav = $first_prev . " &sdot; " . ($has_more ? $next_link : "next");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);
	if ($page == 0 && !@commitlist) {
		print "<p>No match.</p>\n";
	} else {
		git_search_grep_body(\@commitlist, 0, 99, $next_link);
	}

	git_footer_html();
}
6124
# Render the result page of a "pickaxe" search (git log -S<text>).
#
# Takes the commit the page header refers to as a flattened hash (%co);
# %co is then reused for the commit currently being listed.  Uses the
# globals $searchtext, $search_use_regexp, $hash and @diff_opts.
# Each commit reported by git-log becomes one table row, listing the
# files reported for it whose 'to_id' is not the all-zero hash.
sub git_search_changes {
	my %co = @_;

	local $/ = "\n";
	my @log_cmd = (git_cmd(), '--no-pager', 'log', @diff_opts,
		'--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
		($search_use_regexp ? '--pickaxe-regex' : ()));
	open my $fd, '-|', @log_cmd
		or die_error(500, "Open git-log failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	print "<table class=\"pickaxe search\">\n";
	my $dark_row = 1;
	undef %co;

	# closes the file-list cell of the commit held in %co and appends
	# its link cell; used between commits and once more after the loop
	my $finish_commit_row = sub {
		my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
		                          "commit");
		my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
		                                       hash_base=>$co{'id'})},
		                        "tree");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $commit_link .
		      " | " .
		      $tree_link .
		      "</td>\n" .
		      "</tr>\n";
	};

	while (my $line = <$fd>) {
		chomp $line;
		next unless $line;

		my %set = parse_difftree_raw_line($line);
		if (defined $set{'commit'}) {
			# a new commit starts: finish the previous one first
			$finish_commit_row->() if %co;

			my $row_class = $dark_row ? "dark" : "light";
			$dark_row = !$dark_row;
			print "<tr class=\"$row_class\">\n";

			%co = parse_commit($set{'commit'});
			my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
			my $subject_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
			                           -class => "list subject"},
			                           chop_and_escape_str($co{'title'}, 50) . "<br/>");
			print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
			      "<td><i>$author</i></td>\n" .
			      "<td>" .
			      $subject_link;
		} elsif (defined $set{'to_id'}) {
			# entries whose resulting id is all zeros are not listed
			unless ($set{'to_id'} =~ m/^0{40}$/) {
				my $file_link = $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
				                                       hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
				                        -class => "list"},
				                        "<span class=\"match\">" . esc_path($set{'file'}) . "</span>");
				print $file_link .
				      "<br/>\n";
			}
		}
	}
	close $fd;

	# finish last commit
	$finish_commit_row->() if %co;

	print "</table>\n";

	git_footer_html();
}
6207
# Render the result page of a "grep" search over the files of a tree.
#
# Takes the commit being searched as a flattened hash (%co); git-grep is
# run on $co{'tree'}.  Uses the globals $searchtext, $search_use_regexp,
# $search_regexp and $hash.  Matches are grouped into one table row per
# file; the listing stops once more than 1000 output lines have been seen.
sub git_search_files {
	my %co = @_;

	local $/ = "\n";
	open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
		$search_use_regexp ? ('-E', '-i') : '-F',
		$searchtext, $co{'tree'}
			or die_error(500, "Open git-grep failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	print "<table class=\"grep_search\">\n";
	my $alternate = 1;
	my $matches = 0;
	# name of the file whose row is currently open; undef until the first
	# row is started, so that a file named "0" is not mistaken for "none"
	my $lastfile;
	my $file_href;
	while (my $line = <$fd>) {
		chomp $line;
		my ($file, $lno, $ltext, $binary);
		last if ($matches++ > 1000);
		if ($line =~ /^Binary file (.+) matches$/) {
			$file = $1;
			$binary = 1;
		} else {
			# with -z the fields are NUL-separated: file, line number, text
			($file, $lno, $ltext) = split(/\0/, $line, 3);
			$file =~ s/^$co{'tree'}://;
		}
		if (!defined $lastfile || $file ne $lastfile) {
			# close the previous file's row before opening a new one
			print "</td></tr>\n" if defined $lastfile;
			# Toggle the flag as the other *_body tables do; a
			# post-increment here would stay true forever and make
			# every row "dark".
			if ($alternate) {
				print "<tr class=\"dark\">\n";
			} else {
				print "<tr class=\"light\">\n";
			}
			$alternate ^= 1;
			$file_href = href(action=>"blob", hash_base=>$co{'id'},
			                  file_name=>$file);
			print "<td class=\"list\">".
				$cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
			print "</td><td>\n";
			$lastfile = $file;
		}
		if ($binary) {
			print "<div class=\"binary\">Binary file</div>\n";
		} else {
			$ltext = untabify($ltext);
			# highlight the matched part of the line when it can be located
			if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
				$ltext = esc_html($1, -nbsp=>1);
				$ltext .= '<span class="match">';
				$ltext .= esc_html($2, -nbsp=>1);
				$ltext .= '</span>';
				$ltext .= esc_html($3, -nbsp=>1);
			} else {
				$ltext = esc_html($ltext, -nbsp=>1);
			}
			print "<div class=\"pre\">" .
				$cgi->a({-href => $file_href.'#l'.$lno,
				        -class => "linenr"}, sprintf('%4i', $lno)) .
				' ' .  $ltext . "</div>\n";
		}
	}
	if (defined $lastfile) {
		print "</td></tr>\n";
		if ($matches > 1000) {
			print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
		}
	} else {
		print "<div class=\"diff nodifferences\">No matches found</div>\n";
	}
	close $fd;

	print "</table>\n";

	git_footer_html();
}
6285
# Print the "commit_search" table: a row for each non-empty entry of
# $commitlist between indexes $from and $to, showing age, author, subject
# and every comment line matching the global $search_regexp with the
# match highlighted.
#   $from  - first index to show; defaults to 0
#   $to    - last index to show; defaults (and is clamped) to the last index
#   $extra - if defined, HTML printed in a trailing row
sub git_search_grep_body {
	my ($commitlist, $from, $to, $extra) = @_;

	my $last_idx = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"commit_search\">\n";
	my $dark_row = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		# empty entries produce no row and do not affect row colouring
		next unless %co;

		my $commit = $co{'id'};
		my $row_class = $dark_row ? "dark" : "light";
		$dark_row = !$dark_row;
		print "<tr class=\"$row_class\">\n";

		my $author_cell = format_author_html('td', \%co, 15, 5);
		my $subject_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
		                            -class => "list subject"},
		                           chop_and_escape_str($co{'title'}, 50) . "<br/>");
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      $author_cell .
		      "<td>" .
		      $subject_link;

		foreach my $line (@{$co{'comment'}}) {
			next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
			my ($lead, $match, $trail) = ($1, $2, $3);

			# shorten the match, then give the surrounding context
			# whatever is left of 80 characters, at most 30 per side
			$match = chop_str($match, 70, 5, 'center');
			my $contextlen = int((80 - length($match))/2);
			$contextlen = 30 if ($contextlen > 30);
			$lead  = chop_str($lead,  $contextlen, 10, 'left');
			$trail = chop_str($trail, $contextlen, 10, 'right');

			($lead, $match, $trail) =
				(esc_html($lead), esc_html($match), esc_html($trail));

			print "$lead<span class=\"match\">$match</span>$trail<br />";
		}

		my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit");
		my $commitdiff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff");
		my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $commit_link .
		      " | " .
		      $commitdiff_link .
		      " | " .
		      $tree_link;
		print "</td>\n" .
		      "</tr>\n";
	}

	print "<tr>\n" .
	      "<td colspan=\"3\">$extra</td>\n" .
	      "</tr>\n"
		if defined $extra;
	print "</table>\n";
}
6345
6346 ## ======================================================================
6347 ## ======================================================================
6348 ## actions
6349
# Action: show the list of projects.
#
# Reads the optional 'order' input parameter and responds with a 400
# error unless it is exactly one of none, project, descr, owner or age;
# responds with 404 when no project is found.  Optionally includes the
# $home_text file above the project search form and the list.
sub git_project_list {
	my $order = $input_params{'order'};
	# The pattern is anchored so that only the listed values pass; an
	# unanchored match would accept any string merely containing one.
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list($project_filter, $strict_export);
	if (!@list) {
		die_error(404, "No projects found");
	}

	git_header_html();
	if (defined $home_text && -f $home_text) {
		print "<div class=\"index_include\">\n";
		insert_file($home_text);
		print "</div>\n";
	}

	git_project_search_form($searchtext, $search_use_regexp);
	git_project_list_body(\@list, $order);
	git_footer_html();
}
6372
# Action: show the forks of the current project.
#
# Reads the optional 'order' input parameter and responds with a 400
# error unless it is exactly one of none, project, descr, owner or age.
# The project list is filtered by the global $project with a trailing
# ".git" removed; a 404 error is produced when nothing is found.
sub git_forks {
	my $order = $input_params{'order'};
	# The pattern is anchored so that only the listed values pass; an
	# unanchored match would accept any string merely containing one.
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my $filter = $project;
	$filter =~ s/\.git$//;
	my @list = git_get_projects_list($filter);
	if (!@list) {
		die_error(404, "No forks found");
	}

	git_header_html();
	git_print_page_nav('','');
	git_print_header_div('summary', "$project forks");
	git_project_list_body(\@list, $order);
	git_footer_html();
}
6392
# Action: emit a plain-text project index, one "<path> <owner>" line per
# project, with both fields percent-encoded.  Responds with a 404 error
# when no project is found.  Owners missing from a project entry are
# looked up with git_get_project_owner() and stored back into the entry.
sub git_project_index {
	my @projects = git_get_projects_list($project_filter, $strict_export);
	die_error(404, "No projects found") unless @projects;

	print $cgi->header(
		-type => 'text/plain',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="index.aux"');

	foreach my $pr (@projects) {
		$pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
			unless exists $pr->{'owner'};

		# encode copies, leaving the project entry itself untouched
		my @fields = ($pr->{'path'}, $pr->{'owner'});
		foreach my $field (@fields) {
			# quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
			$field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
			$field =~ s/ /\+/g;
		}

		print "$fields[0] $fields[1]\n";
	}
}
6419
6420 sub git_summary {
6421         my $descr = git_get_project_description($project) || "none";
6422         my %co = parse_commit("HEAD");
6423         my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
6424         my $head = $co{'id'};
6425         my $remote_heads = gitweb_check_feature('remote_heads');
6426
6427         my $owner = git_get_project_owner($project);
6428
6429         my $refs = git_get_references();
6430         # These get_*_list functions return one more to allow us to see if
6431         # there are more ...
6432         my @taglist  = git_get_tags_list(16);
6433         my @headlist = git_get_heads_list(16);
6434         my %remotedata = $remote_heads ? git_get_remotes_list() : ();
6435         my @forklist;
6436         my $check_forks = gitweb_check_feature('forks');
6437
6438         if ($check_forks) {
6439                 # find forks of a project
6440                 my $filter = $project;
6441                 $filter =~ s/\.git$//;
6442                 @forklist = git_get_projects_list($filter);
6443                 # filter out forks of forks
6444                 @forklist = filter_forks_from_projects_list(\@forklist)
6445                         if (@forklist);
6446         }
6447
6448         git_header_html();
6449         git_print_page_nav('summary','', $head);
6450
6451         print "<div class=\"title\">&nbsp;</div>\n";
6452         print "<table class=\"projects_list\">\n" .
6453               "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n";
6454         unless ($omit_owner) {
6455                 print  "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
6456         }
6457         if (defined $cd{'rfc2822'}) {
6458                 print "<tr id=\"metadata_lchange\"><td>last change</td>" .
6459                       "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
6460         }
6461
6462         # use per project git URL list in $projectroot/$project/cloneurl
6463         # or make project git URL from git base URL and project name
6464         my $url_tag = "URL";
6465         my @url_list = git_get_project_url_list($project);
6466         @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
6467         foreach my $git_url (@url_list) {
6468                 next unless $git_url;
6469                 print format_repo_url($url_tag, $git_url);
6470                 $url_tag = "";
6471         }
6472
6473         # Tag cloud
6474         my $show_ctags = gitweb_check_feature('ctags');
6475         if ($show_ctags) {
6476                 my $ctags = git_get_project_ctags($project);
6477                 if (%$ctags) {
6478                         # without ability to add tags, don't show if there are none
6479                         my $cloud = git_populate_project_tagcloud($ctags);
6480                         print "<tr id=\"metadata_ctags\">" .
6481                               "<td>content tags</td>" .
6482                               "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
6483                               "</tr>\n";
6484                 }
6485         }
6486
6487         print "</table>\n";
6488
6489         # If XSS prevention is on, we don't include README.html.
6490         # TODO: Allow a readme in some safe format.
6491         if (!$prevent_xss && -s "$projectroot/$project/README.html") {
6492                 print "<div class=\"title\">readme</div>\n" .
6493                       "<div class=\"readme\">\n";
6494                 insert_file("$projectroot/$project/README.html");
6495                 print "\n</div>\n"; # class="readme"
6496         }
6497
6498         # we need to request one more than 16 (0..15) to check if
6499         # those 16 are all
6500         my @commitlist = $head ? parse_commits($head, 17) : ();
6501         if (@commitlist) {
6502                 git_print_header_div('shortlog');
6503                 git_shortlog_body(\@commitlist, 0, 15, $refs,
6504                                   $#commitlist <=  15 ? undef :
6505                                   $cgi->a({-href => href(action=>"shortlog")}, "..."));
6506         }
6507
6508         if (@taglist) {
6509                 git_print_header_div('tags');
6510                 git_tags_body(\@taglist, 0, 15,
6511                               $#taglist <=  15 ? undef :
6512                               $cgi->a({-href => href(action=>"tags")}, "..."));
6513         }
6514
6515         if (@headlist) {
6516                 git_print_header_div('heads');
6517                 git_heads_body(\@headlist, $head, 0, 15,
6518                                $#headlist <= 15 ? undef :
6519                                $cgi->a({-href => href(action=>"heads")}, "..."));
6520         }
6521
6522         if (%remotedata) {
6523                 git_print_header_div('remotes');
6524                 git_remotes_body(\%remotedata, 15, $head);
6525         }
6526
6527         if (@forklist) {
6528                 git_print_header_div('forks');
6529                 git_project_list_body(\@forklist, 'age', 0, 15,
6530                                       $#forklist <= 15 ? undef :
6531                                       $cgi->a({-href => href(action=>"forks")}, "..."),
6532                                       'no_header');
6533         }
6534
6535         git_footer_html();
6536 }
6537
# 'tag' action: show the tag object named by the global $hash.
#
# Prints the page header, a small table linking to the tagged object
# (both by id and by type), the tagger rows when the parsed tag carries
# an 'author' field, and then the tag message one line at a time.
# Reports 404 through die_error() when parse_tag() yields nothing.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # Both cells of the object row link to the same view of the tagged
        # object; only the link text (object id vs. object type) differs.
        my $object_url = href(action=>$tag{'type'}, hash=>$tag{'object'});
        my $id_link    = $cgi->a({-class => "list", -href => $object_url},
                                 $tag{'object'});
        my $type_link  = $cgi->a({-href => $object_url}, $tag{'type'});

        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $id_link . "</td>\n" .
              "<td class=\"link\">" . $type_link . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined $tag{'author'};
        print "</table>\n\n" .
              "</div>\n";

        # tag message
        print "<div class=\"page_body\">";
        for my $text (@{ $tag{'comment'} }) {
                chomp $text;
                print esc_html($text, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6572
# Shared implementation behind the 'blame', 'blame_incremental' and
# 'blame_data' actions.
#
# The first argument selects the output format (default 'porcelain'):
#   'porcelain'   - HTML page built from "git blame -p" output
#   'incremental' - HTML page listing the plain file contents read from
#                   "git cat-file blob"; the page carries a <noscript>
#                   notice saying it requires JavaScript
#   'data'        - text/plain stream of "git blame --incremental" output,
#                   followed by an "END" line
# A 'porcelain' request with the 'javascript' input parameter set is turned
# into an 'incremental' one (and $action is updated to match).
#
# Works on the globals $file_name, $hash_base and $hash; $hash_base defaults
# to the project's head, $hash is looked up from the path when not given.
# Errors are reported through die_error().
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $input_params{'javascript'}) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact comparison: a pattern match would accept any type
                # merely containing "blob" and warns on an undefined type
                if (!defined $ftype || $ftype ne 'blob') {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $line = <$fd>) {
                        print to_utf8($line);
                }
                close $fd
                        or print "ERROR $!\n";

                # end-of-data marker, optionally followed by timing info
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        # row classes alternate between groups of lines (porcelain only)
        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit and line-number links are emitted empty here
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        my $data;
                        # read "<key> <value>" info lines up to the TAB-prefixed
                        # content line; the first value seen for a key is kept
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a group size is only present on the first line of a
                        # group, so the color switches once per group
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # one commit cell spanning the whole group
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to blame of the parent commit
                        # when one is known, otherwise of the blamed commit
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6804
# 'blame' action: git_blame_common() in its default 'porcelain' format.
sub git_blame {
        return git_blame_common('porcelain');
}
6808
# 'blame_incremental' action: git_blame_common() in 'incremental' format.
sub git_blame_incremental {
        my $format = 'incremental';
        return git_blame_common($format);
}
6812
# 'blame_data' action: git_blame_common() in 'data' format.
sub git_blame_data {
        my $format = 'data';
        return git_blame_common($format);
}
6816
# 'tags' action: page listing the tags of the current project.
# The tags table is omitted when git_get_tags_list() returns nothing.
sub git_tags {
        my $head = git_get_head_hash($project);

        git_header_html();
        my $ref_views = format_ref_views('tags');
        git_print_page_nav('', '', $head, undef, $head, $ref_views);
        git_print_header_div('summary', $project);

        my @tags = git_get_tags_list();
        git_tags_body(\@tags) if @tags;

        git_footer_html();
}
6829
# 'heads' action: page listing the heads of the current project.
# The heads table is omitted when git_get_heads_list() returns nothing.
sub git_heads {
        my $head = git_get_head_hash($project);

        git_header_html();
        my $ref_views = format_ref_views('heads');
        git_print_page_nav('', '', $head, undef, $head, $ref_views);
        git_print_header_div('summary', $project);

        my @heads = git_get_heads_list();
        git_heads_body(\@heads, $head) if @heads;

        git_footer_html();
}
6842
6843 # used both for single remote view and for list of all the remotes
# 'remotes' action.  The remote to show comes from the 'hash' input
# parameter: when it is given only that remote is displayed, otherwise
# every remote is listed.  Requires the 'remote_heads' feature.
sub git_remotes {
        unless (gitweb_check_feature('remote_heads')) {
                die_error(403, "Remote heads view is disabled");
        }

        my $head   = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my $remotedata = git_get_remotes_list($remote);
        if (!defined $remotedata) {
                die_error(500, "Unable to get remote information");
        }

        # an empty result: nothing matched the request
        if (!%$remotedata) {
                my $message = "No remotes found";
                $message = "Remote $remote not found" if defined $remote;
                die_error(404, $message);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        my $ref_views = format_ref_views($remote ? '' : 'remotes');
        git_print_page_nav('', '',  $head, undef, $head, $ref_views);

        fill_remote_heads($remotedata);
        if (!defined $remote) {
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head);
        } else {
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        }

        git_footer_html();
}
6875
# 'blob_plain' action: send the raw contents of a blob to the client.
#
# The optional first argument is a content type that is handed on to
# blob_contenttype() together with the open pipe and $file_name.
# The blob is named by the global $hash; when that is undefined it is
# looked up from $file_name in $hash_base (or the project's head).
# Errors are reported through die_error().
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        # NOTE(review): the name is placed in the header as-is; a '"' in
        # $file_name would end the quoted filename early -- confirm that
        # callers validate it.
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* as text/plain; textual */*+xml is treated the same.
        # The subtype before "+xml" may be several letters long (svg, xhtml,
        # rss, ...), hence [a-z]+ rather than a single [a-z].
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
                # keep whatever followed the media type (e.g. "; charset=...")
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp the blob and write it out untouched
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6937
# 'blob' action: HTML view of a blob.
#
# The blob is named by the global $hash; when that is undefined it is
# looked up from $file_name in $hash_base (or the project's head).
# Content that is neither text/* nor a gif/png/jpeg image and that tests
# as binary is handed over to git_blob_plain() instead.  Images are shown
# through an <img> element pointing at the 'blob_plain' view; everything
# else is printed line by line with line-number anchors, optionally run
# through the highlighter first.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        # when a syntax is recognized, read from the highlighter instead
        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable base commit: empty navigation, blob id as title
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                # the URL is written into an attribute by hand, so it gets
                # the same esc_attr() treatment as the attributes above
                print qq! src="! .
                      esc_attr(href(action=>"blob_plain", hash=>$hash,
                                    hash_base=>$hash_base, file_name=>$file_name)) .
                      qq!" />\n!;
        } else {
                my $nr;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        # highlighter output goes through sanitize(), plain
                        # text through esc_html()
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, esc_attr(href(-replay => 1)), $nr, $nr,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
7030
# 'tree' action: HTML listing of a tree object.
#
# $hash_base defaults to "HEAD".  The tree is named by the global $hash;
# when that is undefined it is looked up from $file_name in $hash_base,
# or $hash_base itself is used when no file name was given.  Entries are
# read from "git ls-tree -z" (with -l when the 'show-sizes' feature is on)
# and printed as alternating dark/light table rows, preceded by a ".."
# row when a parent directory can be worked out from $file_name.
sub git_tree {
        if (!defined $hash_base) {
                $hash_base = "HEAD";
        }
        if (!defined $hash) {
                if (defined $file_name) {
                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
                } else {
                        $hash = $hash_base;
                }
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # ls-tree -z output is NUL-separated
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = map { chomp; $_ } <$fd>;
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD"),
                }
                my $snapshot_links = format_snapshot_links($hash);
                if (defined $snapshot_links) {
                        # FIXME: Should be available when we have no hash base as well.
                        push @views_nav, $snapshot_links;
                }
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # no usable base commit: forget it, so that no links based on
                # it are generated below
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                if ($basedir ne '' && substr($basedir, -1) ne '/') {
                        $basedir .= '/';
                }
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";
        my $alternate = 1;
        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                # strip the last path component to get the parent directory
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                # an empty parent means the root tree: pass no file name.
                # Compare against '' explicitly; a plain truth test would
                # also discard a parent directory that is named "0".
                undef $up if $up eq '';
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $line (@entries) {
                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
7140
# Build the "<project>-<version>" name used for a snapshot.
#
# Arguments: $project (project path) and $hash (revision as requested:
# a hexadecimal object name, a refs/... name, or anything else).
# Returns the name in scalar context and the list ($name, $name) in list
# context.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $name = to_utf8($project);
        $name =~ s,([^/])/*\.git$,$1,;
        $name = basename($name);
        # sanitize name
        $name =~ s/[[:cntrl:]]/?/g;

        my $ver = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash
                # (only when $hash really is a prefix of the object name it
                # resolves to, and is longer than 7 characters; the lookup
                # result is checked for definedness before matching)
                my $full_hash = git_get_full_hash($project, $hash);
                if (defined $full_hash &&
                    $full_hash =~ /^$hash/ && length($hash) > 7) {
                        $ver = git_get_short_hash($project, $hash);
                }
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $ver = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!) {
                        $ver = $1;
                }
                $ver .= '-' . git_get_short_hash($project, $hash);
        }
        # in case of hierarchical branch names
        $ver =~ s!/!.!g;

        # name = project-version_string
        $name = "$name-$ver";

        return wantarray ? ($name, $name) : $name;
}
7177
# Answer a conditional GET: if the request carries an If-Modified-Since
# header that can be parsed, and $latest_epoch is not newer than it, print a
# "304 Not Modified" response and jump to the DONE_GITWEB label.
#
# The header is parsed with HTTP::Date when that module can be loaded,
# otherwise with Time::ParseDate; if neither is available (or the date does
# not parse) the sub does nothing.
sub exit_if_unmodified_since {
        my ($latest_epoch) = @_;
        our $cgi;

        my $header = $cgi->http('IF_MODIFIED_SINCE');
        return unless defined $header;

        my $since;
        if (eval { require HTTP::Date; 1; }) {
                $since = HTTP::Date::str2time($header);
        } elsif (eval { require Time::ParseDate; 1; }) {
                $since = Time::ParseDate::parsedate($header, GMT => 1);
        }
        return unless (defined $since && $latest_epoch <= $since);

        my %latest_date = parse_date($latest_epoch);
        print $cgi->header(
                -last_modified => $latest_date{'rfc2822'},
                -status => '304 Not Modified');
        goto DONE_GITWEB;
}
7199
# Action "snapshot": send an archive of the tree-ish in $hash to the client.
#
# The archive format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  The request is rejected
# via die_error when snapshots are not enabled, the format is malformed,
# unknown, disabled or not in @snapshot_fmts, or when $hash does not name a
# tree-ish.  When $hash resolves to a commit, its committer date is used
# for Last-Modified and for If-Modified-Since handling.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # "^{}" peels tags, so $type is the type of the object the tag
        # finally points at
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";

        # %co is empty when $hash is not a commit; then no date is available
        my %co = parse_commit($hash);
        exit_if_unmodified_since($co{'committer_epoch'}) if %co;

        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # escape for use inside the quoted-string of Content-Disposition
        $filename =~ s/(["\\])/\\$1/g;
        my %latest_date;
        if (%co) {
                %latest_date = parse_date($co{'committer_epoch'}, $co{'committer_tz'});
        }

        # Start the archiver before committing to a "200 OK" response, so
        # that a failure to launch it is still reported as a 500 error page
        # instead of being appended to an already-sent success header.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");
        binmode $fd;

        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                %co ? (-last_modified => $latest_date{'rfc2822'}) : (),
                -status => '200 OK');

        # The archive is binary and can be large: copy it through in
        # fixed-size chunks rather than reading it all into memory as a list
        # of newline-separated "lines".
        binmode STDOUT, ':raw';
        while (read($fd, my $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
7257
# Shared implementation of the paged commit-list views.
#
# Parameters:
#   $fmt_name  - view name, passed to format_paging_nav and git_print_page_nav
#   $body_subr - code ref that renders the list; it is called with
#                (\@commitlist, 0, 99, $refs, $next_link,
#                 $file_name, $file_hash, $ftype)
#   $base      - revision to start from; defaults to the project's HEAD hash
#   $parent    - optional; when defined the range "$parent..$base" is listed
#   $file_name - optional path to limit the log to (adds --full-history)
#   $file_hash - optional object id of $file_name; looked up from the listed
#                commits when not given
#
# Up to 101 commits are requested per page (offset 100 * $page) so that the
# presence of a 101st entry tells whether a "next" page exists.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        $base = $head unless defined $base;
        $page = 0 unless defined $page;
        my $refs = git_get_references();

        my $revspec = defined $parent ? "$parent..$base" : $base;
        my @commitlist =
                parse_commits($revspec, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        $ftype = git_get_type($file_hash) if defined $file_hash;
        die_error(500, "Unknown type of object")
                if (defined $file_name && !defined $ftype);

        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }

        # a 101st commit means there is at least one more page
        my $has_more = (@commitlist > 100);

        my $paging_nav = format_paging_nav($fmt_name, $page, $has_more);
        my $next_link = '';
        if ($has_more) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        # offer a "patches" link unless the list is limited to a file or
        # is longer than the configured maximum (negative means no limit)
        my $patch_max = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name &&
            ($patch_max < 0 || @commitlist <= $patch_max)) {
                $paging_nav .= " &sdot; " .
                        $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                "patches");
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
                git_print_page_path($file_name, $ftype, $hash_base);
        } else {
                git_print_header_div('summary', $project);
        }

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
7331
# Action "log": paged commit list rendered by git_log_body, starting at
# $hash and, when $hash_parent is defined, limited to "$hash_parent..$hash".
sub git_log {
        return git_log_generic('log', \&git_log_body, $hash, $hash_parent);
}
7336
# Action "commit": show a single commit -- authorship, commit/tree/parent
# ids with navigation links, the log message and the list of changed files.
#
# The commit is taken from $hash, falling back to $hash_base and then
# "HEAD".  For commits with at most one parent the file list is the diff
# against that parent (or --root); for merges it is the combined (-c) diff.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # link to a commit, labelled with its 7-character abbreviation
        my $short_commit_link = sub {
                my ($id) = @_;
                $cgi->a({-href => href(action=>"commit",
                                       hash=>$id)},
                        esc_html(substr($id, 0, 7)));
        };

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav .= '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                $formats_nav .= '(parent: ' . $short_commit_link->($parent) . ')';
        } else {
                # merge commit
                $formats_nav .=
                        '(merge: ' .
                        join(' ', map { $short_commit_link->($_) } @$parents) .
                        ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        $parent = "--root" unless defined $parent;
        # what to diff against: the only parent / --root, or -c for merges
        my $diff_against = (@$parents <= 1 ? $parent : '-c');
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                $diff_against,
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        chomp(my @difftree = <$fd>);
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires;
        $expires = "+1d" if ($hash =~ m/^[0-9a-fA-F]{40}$/);

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        # the title links to the commitdiff, or to the tree for a root commit
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
        } else {
                git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
        }

        # object header table
        print qq{<div class="title_text">\n} .
              qq{<table class="object_header">\n};
        git_print_authorship_rows(\%co);
        print qq{<tr><td>commit</td><td class="sha1">} . $co{'id'} . qq{</td></tr>\n};

        # tree row; the link cell is left open for the snapshot links
        print qq{<tr>} .
              qq{<td>tree</td>} .
              qq{<td class="sha1">} .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                       class => "list"}, $co{'tree'}) .
              qq{</td>} .
              qq{<td class="link">} .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                      "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if (defined $snapshot_links);
        print qq{</td>} .
              qq{</tr>\n};

        # one row per parent
        foreach my $par (@$parents) {
                print qq{<tr>} .
                      qq{<td>parent</td>} .
                      qq{<td class="sha1">} .
                      $cgi->a({-href => href(action=>"commit", hash=>$par),
                               class => "list"}, $par) .
                      qq{</td>} .
                      qq{<td class="link">} .
                      $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff") .
                      qq{</td>} .
                      qq{</tr>\n};
        }
        print qq{</table>} .
              qq{</div>\n};

        print qq{<div class="page_body">\n};
        git_print_log($co{'comment'});
        print qq{</div>\n};

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
7450
# Action "object": find out what kind of object the request names and
# redirect (302) to the view for that type.
#
# The object is identified either by
#   - $hash or $hash_base alone, or
#   - $hash_base together with $file_name (a path inside that tree-ish).
# Anything else is answered with a 400 error.
sub git_object {
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # cat-file prints nothing for a missing object, which leaves
                # $type undefined; skip chomp then to avoid an
                # "uninitialized value" warning on the way to the 404
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");
                # never redirect to an undefined action
                defined $type
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                # drop trailing slashes so directories are looked up by name
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7497
# Action "blobdiff": show the diff between two versions of a single file.
#
# Parameter:
#   $format - 'html' (default) or 'plain'; anything else is a 400 error
#
# Both $hash_base and $hash_parent_base must be given.  The file is then
# selected either by $file_name (optionally with $file_parent for the old
# name) or, failing that, by a 40-hex $hash that is matched against the
# "to" blob id in the raw diff-tree output.  Requests that do not yield
# exactly one diff entry are rejected.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request left out from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # pass the bare numeric status, as every other die_error
                # call does, rather than a preformatted "404 Not Found"
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$file_name" . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # In the patch header (everything up to and including the
                # "+++" line) replace blob ids that follow "a/" or "b/"
                # with the escaped file names; the rest is copied verbatim.
                while (my $line = <$fd>) {
                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7632
# Action "blobdiff_plain": git_blobdiff with the 'plain' output format.
sub git_blobdiff_plain {
        return git_blobdiff('plain');
}
7636
# Build the navigation fragment for switching between diff styles.
#
# Parameters:
#   $diff_style  - currently selected style; defaults to 'inline'
#   $is_combined - true for combined (merge) diffs, which get no style links
#
# The fragment is meant to be appended to already existing navigation, so
# every entry is prefixed with " | " ("| foo | bar" rather than
# "foo | bar").  The current style is shown as plain text, the others as
# links that replay the request with a different diff_style.
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;
        $diff_style ||= 'inline';

        return "" if ($is_combined);

        # styles in display order, and the label shown for each
        my @order = ('inline', 'sidebyside');
        my %label_for = (
                'inline'     => 'inline',
                'sidebyside' => 'side by side',
        );

        my @entries;
        foreach my $style (@order) {
                push @entries,
                        ($style eq $diff_style
                                ? $label_for{$style}
                                : $cgi->a({-href => href(-replay=>1, diff_style => $style)},
                                          $label_for{$style}));
        }

        return join '', map { " | ".$_ } @entries;
}
7657
# Show the changes introduced by a commit, in one of three output formats.
#
# Named parameters (flat key/value list):
#   -format => 'html' (default), 'plain' or 'patch'
#   -single => for 'patch' without a hash_parent: emit one patch only
#
# The commit is $hash (falling back to $hash_base, then "HEAD").  What it is
# compared against is $hash_parent when given; otherwise the single parent,
# '--root' for a parentless commit, or '--cc' for a merge.
#
# The work is done in three phases that each switch on $format: open the
# git command, write the page or HTTP header, then write the patch itself.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        die_error(403, "Patch view not allowed")
                if ($format eq 'patch' && !$patch_max);

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");
        my $parents = $co{'parents'}; # listref

        # choose format for commitdiff for merge
        if (!defined $hash_parent && @$parents > 1) {
                $hash_parent = '--cc';
        }

        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                # link that replays this request for another commit
                my $replay_link = sub {
                        my ($id, $label) = @_;
                        $cgi->a({-href => href(-replay=>1,
                                               hash=>$id, hash_base=>undef)},
                                esc_html($label));
                };

                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @$parents <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @$parents > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .= ' (from';
                        # say which parent it is, when it is one of them
                        foreach my $idx (0 .. $#$parents) {
                                if ($parents->[$idx] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($idx+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $replay_link->($hash_parent, $hash_parent_short) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @$parents == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $replay_link->($co{'parent'}, substr($co{'parent'}, 0, 7)) .
                                ')';
                } else {
                        # merge commit: offer the other combined-diff flavour
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $replay_link->($_, substr($_, 0, 7));
                                } @$parents ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @$parents > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # phase 1: read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                # consume the raw part; the patch part stays unread on $fd
                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @limit = ($patch_max > 0) ? ("-$patch_max") : ();
                my @commit_spec;
                if ($hash_parent) {
                        # NOTE(review): for a merge with no hash_parent given,
                        # $hash_parent was set to '--cc' above, so this builds
                        # the range "--cc..$hash" -- confirm that is intended.
                        @commit_spec = (@limit, '-n', "$hash_parent..$hash");
                } elsif ($params{-single}) {
                        @commit_spec = ('-1', '--root', $hash);
                } else {
                        @commit_spec = (@limit, "-n", '--root', $hash);
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        $expires = "+1d" if ($hash =~ m/^[0-9a-fA-F]{40}$/);

        # phase 2: write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print qq{<div class="title_text">\n} .
                      qq{<table class="object_header">\n};
                git_print_authorship_rows(\%co);
                print qq{</table>} .
                      qq{</div>\n};
                print qq{<div class="page_body">\n};
                # the title is already in the header; show the log only
                # when there is more than that one line
                if (@{$co{'comment'}} > 1) {
                        print qq{<div class="log">\n};
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print qq{</div>\n}; # class="log"
                }

        } elsif ($format eq 'plain') {
                my $refs = git_get_references("tags"); # result is not used below
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => qq{inline; filename="$filename"});

                # mail-like pseudo header in front of the diff
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => qq{inline; filename="$filename"});
        }

        # phase 3: write patch
        # name of the git command behind $fd for the two text formats
        my %reader_for = (
                'plain' => 'diff-tree',
                'patch' => 'format-patch',
        );
        if ($format eq 'html') {
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                my @diff_parents = $use_parents ? @$parents : $hash_parent;

                git_difftree_body(\@difftree, $hash, @diff_parents);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash, @diff_parents);
                close $fd;
                print qq{</div>\n}; # class="page_body"
                git_footer_html();

        } elsif (exists $reader_for{$format}) {
                # headers are already sent, so a failure can only be
                # reported as a trailing line of text
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-$reader_for{$format} failed\n";
        }
}
7885
# Action handler: delegate to git_commitdiff(), asking for the 'plain'
# output format.
sub git_commitdiff_plain {
        return git_commitdiff('-format' => 'plain');
}
7889
7890 # format-patch-style patches
# Action handler: delegate to git_commitdiff() with the 'patch' format
# and the -single flag set.
sub git_patch {
        return git_commitdiff(
                '-format' => 'patch',
                '-single' => 1,
        );
}
7894
# Action handler: delegate to git_commitdiff() with the 'patch' format
# (without the -single flag used by git_patch).
sub git_patches {
        return git_commitdiff('-format' => 'patch');
}
7898
# Action handler: render the 'history' view through git_log_generic(),
# using git_history_body() as the body renderer and passing the current
# $hash_base, $hash_parent_base, $file_name and $hash request globals.
sub git_history {
        return git_log_generic(
                'history', \&git_history_body,
                $hash_base, $hash_parent_base, $file_name, $hash,
        );
}
7904
# Action handler for search requests.
#
# Defaults $searchtype to 'commit', checks that the 'search' feature (and,
# for 'pickaxe' / 'grep' searches, the matching feature) is enabled, fills
# in defaults for $hash and $page, and then hands the parsed commit to the
# search routine matching $searchtype.  Failures are reported through
# die_error(): 403 for disabled features, 400 for a missing search text or
# an unknown search type, 404 when the commit cannot be parsed.
sub git_search {
        $searchtype ||= 'commit';

        # check if appropriate features are enabled
        die_error(403, "Search is disabled")
                unless gitweb_check_feature('search');

        # pickaxe may take all resources of your box and run for several minutes
        # with every query - so decide by yourself how public you make this feature;
        # grep search might be potentially CPU-intensive, too
        my %disabled_message_for = (
                'pickaxe' => "Pickaxe search is disabled",
                'grep'    => "Grep search is disabled",
        );
        if (exists $disabled_message_for{$searchtype}) {
                die_error(403, $disabled_message_for{$searchtype})
                        unless gitweb_check_feature($searchtype);
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0
                unless defined $page;

        # search type => routine that performs the search and prints the page
        my %handler_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );
        if (my $handler = $handler_for{$searchtype}) {
                $handler->(%co);
        } else {
                die_error(400, "Unknown search type");
        }
}
7949
# Action handler: print the static help page describing the search types.
# The 'grep' and 'pickaxe' entries are printed only when the corresponding
# feature is enabled according to gitweb_check_feature().
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # The help text contains nothing to interpolate, hence the
        # single-quoted here-documents.
        print <<'HTML';
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HTML

        if (gitweb_check_feature('grep')) {
                print <<'HTML';
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HTML
        }

        print <<'HTML';
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HTML

        if (gitweb_check_feature('pickaxe')) {
                print <<'HTML';
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HTML
        }

        print "</dl>\n";
        git_footer_html();
}
7993
# Action handler: render the 'shortlog' view through git_log_generic(),
# using git_shortlog_body() as the body renderer and passing the current
# $hash and $hash_parent request globals.
sub git_shortlog {
        return git_log_generic(
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
}
7998
7999 ## ......................................................................
8000 ## feeds (RSS, Atom; OPML)
8001
# Print a web feed for the current project to STDOUT.
#
# Parameter: the feed format, 'rss' or 'atom' (default 'atom'); any other
# value is rejected with die_error(400).
#
# The feed covers the commits returned by parse_commits() starting at $hash
# (or 'HEAD' when $hash is unset), optionally limited to $file_name.  The
# HTTP header is printed first; for a HEAD request the function returns
# right after it.  Each listed commit becomes one <item> (RSS) or <entry>
# (Atom) containing the commit message and a list of changed files with
# links to the diff, blame (if that feature is enabled) and history views.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                exit_if_unmodified_since($latest_epoch);
                # the key is 'committer_tz'; a misspelled key would silently
                # pass undef as the timezone
                %latest_date = parse_date($latest_epoch, $latest_commit{'committer_tz'});
        }
        print $cgi->header(
                -type => $content_type,
                -charset => 'utf-8',
                %latest_date ? (-last_modified => $latest_date{'rfc2822'}) : (),
                -status => '200 OK');

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title contains request-supplied text ($hash, $file_name) and is
        # printed into XML element content below, so it must be escaped
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (defined $descr) {
                $descr = esc_html($descr);
        } else {
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for my $i (0 .. $#commitlist) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files; a commit whose diff-tree cannot be
                # run or fails is left out of the feed
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        # print the escaped copy; assigning to $line would modify
                        # the commit's comment array through the loop alias
                        print esc_html($line) . "\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
8238
# Action handler: produce the feed in RSS format via git_feed().
sub git_rss {
        return git_feed('rss');
}
8242
# Action handler: produce the feed in Atom format via git_feed().
sub git_atom {
        return git_feed('atom');
}
8246
# Action handler: print an OPML 1.0 document with one <outline> per project,
# each pointing at the project's RSS feed and summary page.
#
# The projects come from git_get_projects_list($project_filter,
# $strict_export); an empty list is reported with die_error(404).  Projects
# for which no head hash is found, or whose head commit cannot be parsed,
# are left out.  Note that the global $git_dir is reassigned for each
# project that has a head hash.
sub git_opml {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found")
                unless @projects;

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # suffix for the document title, used only when a project filter is set
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $proj (@projects) {
                my $proj_path = $proj->{'path'};

                my $head = git_get_head_hash($proj_path);
                next unless defined $head;

                # parse_commit() below is called without a project argument,
                # so point the global $git_dir at this project first
                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next unless %co;

                my $path = esc_html(chop_str($proj_path, 25, 5));
                my $rss  = href('project' => $proj_path, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj_path, 'action' => 'summary', -full => 1);
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }

        print <<XML;
</outline>
</body>
</opml>
XML
}