Merge branch 'maint-1.7.11' into maint
[git.git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
21 binmode STDOUT, ':utf8';
22
23 our $t0 = [ gettimeofday() ];
24 our $number_of_git_cmds = 0;
25
26 BEGIN {
27         CGI->compile() if $ENV{'MOD_PERL'};
28 }
29
30 our $version = "++GIT_VERSION++";
31
our ($my_url, $my_uri, $base_url, $path_info, $home_link);

# Compute the URL-related globals for the current request:
#   $my_url    - full URL of the script, without PATH_INFO
#   $my_uri    - absolute (host-less) path of the script, without PATH_INFO
#   $base_url  - base for relative URLs ($logo, $favicon, ...)
#   $path_info - decoded PATH_INFO of the request
#   $home_link - target of the home link on top of all pages
# Reads the global $cgi object and %ENV.
sub evaluate_uri {
	our $cgi;
	our ($my_url, $my_uri, $base_url, $path_info, $home_link);

	$my_url = $cgi->url();
	$my_uri = $cgi->url(-absolute => 1);

	# Base URL for relative URLs in gitweb; needed and used only for
	# URLs with nonempty PATH_INFO.
	$base_url = $my_url;

	# When the script is used as DirectoryIndex, the URL does not contain
	# the name of the script file itself, and $cgi->url() fails to strip
	# PATH_INFO, so it is stripped here.  $path_info is global because it
	# is also used later on.
	#
	# In the DirectoryIndex case $my_url is not the full script URL.  That
	# is good for generated links (they keep implying the script name when
	# the handled URL did not name it), but it means $my_url cannot serve
	# as base URL.  So whenever PATH_INFO had to be stripped, the base URL
	# is rebuilt from the server base and SCRIPT_NAME.
	$path_info = decode_utf8($ENV{"PATH_INFO"});
	if ($path_info
	    && $my_url =~ s{\Q$path_info\E$}{}
	    && $my_uri =~ s{\Q$path_info\E$}{}
	    && defined $ENV{'SCRIPT_NAME'}) {
		$base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
	}

	# target of the home link on top of all pages
	$home_link = $my_uri || "/";
}
67
68 # core git executable to use
69 # this can just be "git" if your webserver has a sensible PATH
70 our $GIT = "++GIT_BINDIR++/git";
71
72 # absolute fs-path which will be prepended to the project path
73 #our $projectroot = "/pub/scm";
74 our $projectroot = "++GITWEB_PROJECTROOT++";
75
76 # fs traversing limit for getting project list
77 # the number is relative to the projectroot
78 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
79
80 # string of the home link on top of all pages
81 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
82
83 # name of your site or organization to appear in page titles
84 # replace this with something more descriptive for clearer bookmarks
85 our $site_name = "++GITWEB_SITENAME++"
86                  || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
87
88 # html snippet to include in the <head> section of each page
89 our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
90 # filename of html text to include at top of each page
91 our $site_header = "++GITWEB_SITE_HEADER++";
92 # html text to include at home page
93 our $home_text = "++GITWEB_HOMETEXT++";
94 # filename of html text to include at bottom of each page
95 our $site_footer = "++GITWEB_SITE_FOOTER++";
96
97 # URI of stylesheets
98 our @stylesheets = ("++GITWEB_CSS++");
99 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
100 our $stylesheet = undef;
101 # URI of GIT logo (72x27 size)
102 our $logo = "++GITWEB_LOGO++";
103 # URI of GIT favicon, assumed to be image/png type
104 our $favicon = "++GITWEB_FAVICON++";
105 # URI of gitweb.js (JavaScript code for gitweb)
106 our $javascript = "++GITWEB_JS++";
107
108 # URI and label (title) of GIT logo link
109 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
110 #our $logo_label = "git documentation";
111 our $logo_url = "http://git-scm.com/";
112 our $logo_label = "git homepage";
113
114 # source of projects list
115 our $projects_list = "++GITWEB_LIST++";
116
117 # the width (in characters) of the projects list "Description" column
118 our $projects_list_description_width = 25;
119
120 # group projects by category on the projects list
121 # (enabled if this variable evaluates to true)
122 our $projects_list_group_categories = 0;
123
124 # default category if none specified
125 # (leave the empty string for no category)
126 our $project_list_default_category = "";
127
128 # default order of projects list
129 # valid values are none, project, descr, owner, and age
130 our $default_projects_order = "project";
131
132 # show repository only if this file exists
133 # (only effective if this variable evaluates to true)
134 our $export_ok = "++GITWEB_EXPORT_OK++";
135
136 # don't generate age column on the projects list page
137 our $omit_age_column = 0;
138
139 # don't generate information about owners of repositories
140 our $omit_owner=0;
141
142 # show repository only if this subroutine returns true
143 # when given the path to the project, for example:
144 #    sub { return -e "$_[0]/git-daemon-export-ok"; }
145 our $export_auth_hook = undef;
146
147 # only allow viewing of repositories also shown on the overview page
148 our $strict_export = "++GITWEB_STRICT_EXPORT++";
149
150 # list of git base URLs used for URL to where fetch project from,
151 # i.e. full URL is "$git_base_url/$project"
152 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
153
154 # default blob_plain mimetype and default charset for text/plain blob
155 our $default_blob_plain_mimetype = 'text/plain';
156 our $default_text_plain_charset  = undef;
157
158 # file to use for guessing MIME types before trying /etc/mime.types
159 # (relative to the current git repository)
160 our $mimetypes_file = undef;
161
162 # assume this charset if line contains non-UTF-8 characters;
163 # it should be valid encoding (see Encode::Supported(3pm) for list),
164 # for which encoding all byte sequences are valid, for example
165 # 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
166 # could be even 'utf-8' for the old behavior)
167 our $fallback_encoding = 'latin1';
168
169 # rename detection options for git-diff and git-diff-tree
170 # - default is '-M', with the cost proportional to
171 #   (number of removed files) * (number of new files).
172 # - more costly is '-C' (which implies '-M'), with the cost proportional to
173 #   (number of changed files + number of removed files) * (number of new files)
174 # - even more costly is '-C', '--find-copies-harder' with cost
175 #   (number of files in the original tree) * (number of new files)
176 # - one might want to include '-B' option, e.g. '-B', '-M'
177 our @diff_opts = ('-M'); # taken from git_commit
178
179 # Disables features that would allow repository owners to inject script into
180 # the gitweb domain.
181 our $prevent_xss = 0;
182
183 # Path to the highlight executable to use (must be the one from
184 # http://www.andre-simon.de due to assumptions about parameters and output).
185 # Useful if highlight is not installed on your webserver's PATH.
186 # [Default: highlight]
187 our $highlight_bin = "++HIGHLIGHT_BIN++";
188
# Snapshot formats that gitweb is capable of serving.
#
# Each entry has the form
#
#   name => {
#       'display'    => display name,
#       'type'       => mime type,
#       'suffix'     => filename suffix,
#       'format'     => --format for git-archive,
#       'compressor' => [compressor command and arguments]
#                       (array reference, optional)
#       'disabled'   => boolean (optional)
#   }
our %known_snapshot_formats = (
	'tgz' => {
		'display'    => 'tar.gz',
		'type'       => 'application/x-gzip',
		'suffix'     => '.tar.gz',
		'format'     => 'tar',
		'compressor' => ['gzip', '-n'],
	},

	'tbz2' => {
		'display'    => 'tar.bz2',
		'type'       => 'application/x-bzip2',
		'suffix'     => '.tar.bz2',
		'format'     => 'tar',
		'compressor' => ['bzip2'],
	},

	'txz' => {
		'display'    => 'tar.xz',
		'type'       => 'application/x-xz',
		'suffix'     => '.tar.xz',
		'format'     => 'tar',
		'compressor' => ['xz'],
		'disabled'   => 1,
	},

	'zip' => {
		'display' => 'zip',
		'type'    => 'application/x-zip',
		'suffix'  => '.zip',
		'format'  => 'zip',
	},
);
228
# Aliases that let gitweb understand old gitweb.snapshot values found in
# repository configuration.  An alias mapped to undef is recognized but
# does not correspond to any currently supported format.
our %known_snapshot_format_aliases = (
	'gzip'  => 'tgz',
	'bzip2' => 'tbz2',
	'xz'    => 'txz',

	# backward compatibility: legacy gitweb config support
	'x-gzip'  => undef,
	'gz'      => undef,
	'x-bzip2' => undef,
	'bz2'     => undef,
	'x-zip'   => undef,
	''        => undef,
);
241
# Pixel sizes for icons and avatars.  If the default font sizes or
# line heights are changed, it may be appropriate to change these
# values too, via $GITWEB_CONFIG.
our %avatar_size = (
	'default' => 16,
	'double'  => 32,
);
249
250 # Used to set the maximum load that we will still respond to gitweb queries.
251 # If server load exceeds this value then return "503 server busy" error.
252 # If gitweb cannot determine server load, it is taken to be 0.
253 # Leave it undefined (or set to 'undef') to turn off load checking.
254 our $maxload = 300;
255
# Configuration for 'highlight' (http://www.andre-simon.de/):
# syntax selected by the basename of the file.
our %highlight_basename = (
	#'Program' => 'py',
	#'Library' => 'py',
	'SConstruct' => 'py',   # SCons equivalent of Makefile
	'Makefile'   => 'make',
);
# Configuration for 'highlight': syntax selected by file extension.
# Keys are file extensions, values are the syntax names understood by
# the highlighter.
#
# Every map() is wrapped in parentheses on purpose: map is a list
# operator, so without them the first map would swallow all entries
# that follow it and every extension would end up mapped to itself.
our %highlight_ext = (
	# main extensions, defining name of syntax;
	# see files in /usr/share/highlight/langDefs/ directory
	(map { $_ => $_ }
		qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make)),
	# alternate extensions, see /etc/highlight/filetypes.conf
	'h' => 'c',
	(map { $_ => 'sh'   } qw(bash zsh ksh)),
	(map { $_ => 'cpp'  } qw(cxx c++ cc)),
	(map { $_ => 'php'  } qw(php3 php4 php5 phps)),
	(map { $_ => 'pl'   } qw(perl pm)), # perhaps also 'cgi'
	(map { $_ => 'make' } qw(mak mk)),
	(map { $_ => 'xml'  } qw(xhtml html htm)),
);
279
# Site-wide feature defaults are defined here; override them with
# $GITWEB_CONFIG as necessary.
our %feature = (
	# feature => {
	#	'sub'      => feature-sub (subroutine),
	#	'override' => allow-override (boolean),
	#	'default'  => [ default options... ] (array reference),
	# }
	#
	# If a feature is overridable (allow-override has a true value),
	# then feature-sub is called with the default options as parameters;
	# the return value of feature-sub indicates whether to enable the
	# specified feature.
	#
	# If there is no 'sub' key (no feature-sub), then the feature cannot
	# be overridden.
	#
	# Use gitweb_get_feature(<feature>) to retrieve the <feature> value
	# (an array) or gitweb_check_feature(<feature>) to check if <feature>
	# is enabled.

	# Enable the 'blame' blob view, showing the last commit that modified
	# each line in the file. This can be very CPU-intensive.

	# To enable system wide have in $GITWEB_CONFIG
	# $feature{'blame'}{'default'} = [1];
	# To have project specific config enable override in $GITWEB_CONFIG
	# $feature{'blame'}{'override'} = 1;
	# and in project config gitweb.blame = 0|1;
	'blame' => {
		'sub'      => sub { feature_bool('blame', @_) },
		'override' => 0,
		'default'  => [0],
	},

	# Enable the 'snapshot' link, providing a compressed archive of any
	# tree. This can potentially generate high traffic if you have large
	# projects.

	# Value is a list of formats defined in %known_snapshot_formats that
	# you wish to offer.
	# To disable system wide have in $GITWEB_CONFIG
	# $feature{'snapshot'}{'default'} = [];
	# To have project specific config enable override in $GITWEB_CONFIG
	# $feature{'snapshot'}{'override'} = 1;
	# and in project config, a comma-separated list of formats or "none"
	# to disable.  Example: gitweb.snapshot = tbz2,zip;
	'snapshot' => {
		'sub'      => \&feature_snapshot,
		'override' => 0,
		'default'  => ['tgz'],
	},

	# Enable text search, which will list the commits which match author,
	# committer or commit text to a given string.  Enabled by default.
	# Project specific override is not supported.
	#
	# Note that this controls all search features, which means that if
	# it is disabled, then 'grep' and 'pickaxe' search would also be
	# disabled.
	'search' => {
		'override' => 0,
		'default'  => [1],
	},

	# Enable grep search, which will list the files in the currently
	# selected tree containing the given string. Enabled by default.
	# This can be potentially CPU-intensive, of course.
	# Note that you need to have 'search' feature enabled too.

	# To enable system wide have in $GITWEB_CONFIG
	# $feature{'grep'}{'default'} = [1];
	# To have project specific config enable override in $GITWEB_CONFIG
	# $feature{'grep'}{'override'} = 1;
	# and in project config gitweb.grep = 0|1;
	'grep' => {
		'sub'      => sub { feature_bool('grep', @_) },
		'override' => 0,
		'default'  => [1],
	},

	# Enable the pickaxe search, which will list the commits that modified
	# a given string in a file. This can be a practical and considerably
	# faster alternative to 'blame', but is still potentially
	# CPU-intensive.
	# Note that you need to have 'search' feature enabled too.

	# To enable system wide have in $GITWEB_CONFIG
	# $feature{'pickaxe'}{'default'} = [1];
	# To have project specific config enable override in $GITWEB_CONFIG
	# $feature{'pickaxe'}{'override'} = 1;
	# and in project config gitweb.pickaxe = 0|1;
	'pickaxe' => {
		'sub'      => sub { feature_bool('pickaxe', @_) },
		'override' => 0,
		'default'  => [1],
	},

	# Enable showing size of blobs in a 'tree' view, in a separate
	# column, similar to what 'ls -l' does.  This costs a bit of IO.

	# To disable system wide have in $GITWEB_CONFIG
	# $feature{'show-sizes'}{'default'} = [0];
	# To have project specific config enable override in $GITWEB_CONFIG
	# $feature{'show-sizes'}{'override'} = 1;
	# and in project config gitweb.showsizes = 0|1;
	'show-sizes' => {
		'sub'      => sub { feature_bool('showsizes', @_) },
		'override' => 0,
		'default'  => [1],
	},

	# Make gitweb use an alternative format of the URLs which can be
	# more readable and natural-looking: project name is embedded
	# directly in the path and the query string contains other
	# auxiliary information. All gitweb installations recognize
	# URLs in either format; this configures in which format gitweb
	# generates links.

	# To enable system wide have in $GITWEB_CONFIG
	# $feature{'pathinfo'}{'default'} = [1];
	# Project specific override is not supported.

	# Note that you will need to change the default location of CSS,
	# favicon, logo and possibly other files to an absolute URL. Also,
	# if gitweb.cgi serves as your indexfile, you will need to force
	# $my_uri to contain the script name in your $GITWEB_CONFIG.
	'pathinfo' => {
		'override' => 0,
		'default'  => [0],
	},

	# Make gitweb consider projects in project root subdirectories
	# to be forks of existing projects. Given project $projname.git,
	# projects matching $projname/*.git will not be shown in the main
	# projects list, instead a '+' mark will be added to $projname
	# there and a 'forks' view will be enabled for the project, listing
	# all the forks. If project list is taken from a file, forks have
	# to be listed after the main project.

	# To enable system wide have in $GITWEB_CONFIG
	# $feature{'forks'}{'default'} = [1];
	# Project specific override is not supported.
	'forks' => {
		'override' => 0,
		'default'  => [0],
	},

	# Insert custom links to the action bar of all project pages.
	# This enables you mainly to link to third-party scripts integrating
	# into gitweb; e.g. git-browser for graphical history representation
	# or custom web-based repository administration interface.

	# The 'default' value consists of a list of triplets in the form
	# (label, link, position) where position is the label after which
	# to insert the link and link is a format string where %n expands
	# to the project name, %f to the project path within the filesystem,
	# %h to the current hash (h gitweb parameter) and %b to the current
	# hash base (hb gitweb parameter); %% expands to %.

	# To enable system wide have in $GITWEB_CONFIG e.g.
	# $feature{'actions'}{'default'} = [('graphiclog',
	#	'/git-browser/by-commit.html?r=%n', 'summary')];
	# Project specific override is not supported.
	'actions' => {
		'override' => 0,
		'default'  => [],
	},

	# Allow gitweb to scan project content tags of the project
	# repository, and display the popular Web 2.0-ish "tag cloud" near
	# the projects list.  Note that this is something COMPLETELY
	# different from the normal Git tags.

	# gitweb by itself can show existing tags, but it does not handle
	# tagging itself; you need to do it externally, outside gitweb.
	# The format is described in git_get_project_ctags() subroutine.
	# You may want to install the HTML::TagCloud Perl module to get
	# a pretty tag cloud instead of just a list of tags.

	# To enable system wide have in $GITWEB_CONFIG
	# $feature{'ctags'}{'default'} = [1];
	# Project specific override is not supported.

	# In the future whether ctags editing is enabled might depend
	# on the value, but using 1 should always mean no editing of ctags.
	'ctags' => {
		'override' => 0,
		'default'  => [0],
	},

	# The maximum number of patches in a patchset generated in patch
	# view. Set this to 0 or undef to disable patch view, or to a
	# negative number to remove any limit.

	# To disable system wide have in $GITWEB_CONFIG
	# $feature{'patches'}{'default'} = [0];
	# To have project specific config enable override in $GITWEB_CONFIG
	# $feature{'patches'}{'override'} = 1;
	# and in project config gitweb.patches = 0|n;
	# where n is the maximum number of patches allowed in a patchset.
	'patches' => {
		'sub'      => \&feature_patches,
		'override' => 0,
		'default'  => [16],
	},

	# Avatar support. When this feature is enabled, views such as
	# shortlog or commit will display an avatar associated with
	# the email of the committer(s) and/or author(s).

	# Currently available providers are gravatar and picon.
	# If an unknown provider is specified, the feature is disabled.

	# Gravatar depends on Digest::MD5.
	# Picon currently relies on the indiana.edu database.

	# To enable system wide have in $GITWEB_CONFIG
	# $feature{'avatar'}{'default'} = ['<provider>'];
	# where <provider> is either gravatar or picon.
	# To have project specific config enable override in $GITWEB_CONFIG
	# $feature{'avatar'}{'override'} = 1;
	# and in project config gitweb.avatar = <provider>;
	'avatar' => {
		'sub'      => \&feature_avatar,
		'override' => 0,
		'default'  => [''],
	},

	# Enable displaying how much time and how many git commands
	# it took to generate and display page.  Disabled by default.
	# Project specific override is not supported.
	'timed' => {
		'override' => 0,
		'default'  => [0],
	},

	# Enable turning some links into links to actions which require
	# JavaScript to run (like 'blame_incremental').  Not enabled by
	# default.  Project specific override is currently not supported.
	'javascript-actions' => {
		'override' => 0,
		'default'  => [0],
	},

	# Enable and configure ability to change common timezone for dates
	# in gitweb output via JavaScript.  Enabled by default.
	# Project specific override is not supported.
	'javascript-timezone' => {
		'override' => 0,
		'default'  => [
			# default timezone: 'utc', 'local', or '(-|+)HHMM' format,
			# or undef to turn off this feature
			'local',
			# name of cookie where to store selected timezone
			'gitweb_tz',
			# CSS class used to mark up dates for manipulation
			'datetime',
		],
	},

	# Syntax highlighting support. This is based on Daniel Svensson's
	# and Sham Chukoury's work in gitweb-xmms2.git.
	# It requires the 'highlight' program present in $PATH,
	# and therefore is disabled by default.

	# To enable system wide have in $GITWEB_CONFIG
	# $feature{'highlight'}{'default'} = [1];

	'highlight' => {
		'sub'      => sub { feature_bool('highlight', @_) },
		'override' => 0,
		'default'  => [0],
	},

	# Enable displaying of remote heads in the heads list

	# To enable system wide have in $GITWEB_CONFIG
	# $feature{'remote_heads'}{'default'} = [1];
	# To have project specific config enable override in $GITWEB_CONFIG
	# $feature{'remote_heads'}{'override'} = 1;
	# and in project config gitweb.remote_heads = 0|1;
	'remote_heads' => {
		'sub'      => sub { feature_bool('remote_heads', @_) },
		'override' => 0,
		'default'  => [0],
	},
);
545
# Return the value (a list of options) of the feature named $name.
#
# Returns nothing if the feature is unknown.  The site-wide defaults are
# returned unless the feature allows overriding and a project is
# selected ($git_dir is defined); in that case the feature-sub is called
# with the defaults and its result is returned.
sub gitweb_get_feature {
	my ($name) = @_;
	return unless exists $feature{$name};

	my $entry       = $feature{$name};
	my $handler     = $entry->{'sub'};
	my $overridable = $entry->{'override'};
	my @defaults    = @{$entry->{'default'}};

	# project specific override is possible only if we have project
	our $git_dir; # global variable, declared later
	unless ($overridable && defined $git_dir) {
		return @defaults;
	}

	# an overridable feature without a feature-sub is a configuration
	# mistake; report it and fall back to the defaults
	unless (defined $handler) {
		warn "feature $name is not overridable";
		return @defaults;
	}
	return $handler->(@defaults);
}
564
# Convenience wrapper returning only the first option of a feature,
# which for boolean features tells whether the feature is enabled.
# It allows writing
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# in place of
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
	my @args = @_;
	# list slice, so that the wrapper is usable in scalar context
	return (gitweb_get_feature(@args))[0];
}
579
580
# Feature-sub for boolean features overridable per project.
#
# $key is the name of the gitweb.* project config variable; the remaining
# arguments are the site-wide default options.  Returns a one-element
# list: the default when the project does not set the variable, 1 for
# 'true' and 0 for 'false'.  Any other value is treated as false; this
# used to happen only implicitly, by falling off the end of the sub.
sub feature_bool {
	my $key = shift;
	my ($val) = git_get_project_config($key, '--bool');

	if (!defined $val) {
		return ($_[0]);
	} elsif ($val eq 'true') {
		return (1);
	} elsif ($val eq 'false') {
		return (0);
	}

	# unrecognized value: keep the feature disabled, explicitly
	return (0);
}
593
# Feature-sub for 'snapshot': the arguments are the default formats.
# A true gitweb.snapshot project config value replaces them: "none"
# selects no formats, anything else is split on commas and whitespace.
sub feature_snapshot {
	my @formats = @_;

	my ($configured) = git_get_project_config('snapshot');

	if ($configured) {
		if ($configured eq 'none') {
			@formats = ();
		} else {
			@formats = split /\s*[,\s]\s*/, $configured;
		}
	}

	return @formats;
}
605
# Feature-sub for 'patches': use the integer gitweb.patches project
# config value when there is one, otherwise the first default option.
sub feature_patches {
	my @configured = (git_get_project_config('patches', '--int'));

	return @configured if @configured;
	return ($_[0]);
}
615
# Feature-sub for 'avatar': use the gitweb.avatar project config value
# when there is one, otherwise the default options passed in.
sub feature_avatar {
	my @configured = (git_get_project_config('avatar'));

	if (@configured) {
		return @configured;
	}
	return @_;
}
621
# Tell whether $dir has a usable HEAD.
#
# Testing the HEAD file with -e alone is fragile: in a repository
# initialized long ago HEAD may be a symlink, and after pack-refs and
# prune its target may no longer exist.  Such a dangling symlink is still
# accepted as long as it points below refs/heads/.
sub check_head_link {
	my ($dir) = @_;
	my $head = "$dir/HEAD";

	return 1 if -e $head;
	return (-l $head && readlink($head) =~ m{^refs/heads/});
}
631
# Tell whether the repository in $dir may be shown.  All of the following
# must hold, checked in this order:
#  - it has a usable HEAD,
#  - the $export_ok marker file exists in it (if $export_ok is set),
#  - $export_auth_hook approves it (if the hook is set).
sub check_export_ok {
	my ($dir) = @_;

	return (
		check_head_link($dir)
		&& (!$export_ok || -e "$dir/$export_ok")
		&& (!$export_auth_hook || $export_auth_hook->($dir))
	);
}
638
# Normalize a list of snapshot format names.
#
# Alternate names are replaced through %known_snapshot_format_aliases
# (backward compatibility), then every format that is unknown or marked
# 'disabled' in %known_snapshot_formats is filtered out.  Legacy aliases
# map to undef; those entries are dropped before any hash lookup so that
# they do not cause "uninitialized value" warnings.
# Returns the filtered list (its length in scalar context).
sub filter_snapshot_fmts {
	my @fmts = @_;

	@fmts = map {
		defined $_ && exists $known_snapshot_format_aliases{$_}
			? $known_snapshot_format_aliases{$_}
			: $_
	} @fmts;
	@fmts = grep {
		defined $_ &&
		exists $known_snapshot_formats{$_} &&
		!$known_snapshot_formats{$_}{'disabled'}
	} @fmts;

	return @fmts;
}
651
652 # If it is set to a code reference, it is code that is to be run once per
653 # request, allowing updating configurations that change with each request,
654 # while running other code in config file only once.
655 #
656 # Otherwise, if it is false then gitweb would process config file only once;
657 # if it is true then gitweb config would be run for each request.
658 our $per_request_config = 1;
659
# Read and evaluate the gitweb config file named by $filename.
#
# Returns true on success and nothing on a recoverable error (no filename
# given, or the file does not exist), which allows chaining calls and
# using the first file that exists.  Dies on errors while parsing the
# config file, as those are unrecoverable.
sub read_config_file {
	my $filename = shift;
	return unless defined $filename;
	if (-e $filename) {
		# "do FILE" searches @INC for relative names that do not start
		# with ./ or ../, and '.' is not in @INC on newer Perls.  Use an
		# absolute path so that exactly the file tested above is loaded.
		require File::Spec;
		my $config_path = File::Spec->rel2abs($filename);

		do $config_path;
		# die if there are errors parsing config file
		die $@ if $@;
		return 1;
	}
	return;
}
675
our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);

# Determine the names of the gitweb config files (environment variables
# take precedence over the built-in values) and read them: first the
# common config, then the first existing one of the per-instance and
# the system-wide config.
sub evaluate_gitweb_config {
	our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);

	$GITWEB_CONFIG        = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
	$GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
	$GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";

	# Protect against duplicated file names, to not read a config twice.
	# Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
	# a duplicated filename between those two doesn't matter.
	if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON) {
		$GITWEB_CONFIG = "";
	}
	if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON) {
		$GITWEB_CONFIG_SYSTEM = "";
	}

	# Common system-wide settings for convenience.
	# Those settings can be overridden by GITWEB_CONFIG or
	# GITWEB_CONFIG_SYSTEM.
	read_config_file($GITWEB_CONFIG_COMMON);

	# Use the first config file that exists.  This means use the
	# per-instance GITWEB_CONFIG if it exists, otherwise use
	# GITWEB_CONFIG_SYSTEM.
	return if read_config_file($GITWEB_CONFIG);
	return read_config_file($GITWEB_CONFIG_SYSTEM);
}
697
# Get the load average of the system, to compare against $maxload.
# Currently this requires '/proc/loadavg' to be present; if it is not
# (or cannot be opened), 0 is returned, which means no load checking.
sub get_loadavg {
	my $proc_loadavg = '/proc/loadavg';

	# additional checks for load average should go here for systems
	# that don't export /proc/loadavg
	return 0 unless -e $proc_loadavg;

	open my $fd, '<', $proc_loadavg
		or return 0;
	my $line = <$fd>;
	close $fd;

	# The first three columns measure CPU and IO utilization of the last
	# one, five, and 10 minute periods.  The fourth column shows the
	# number of currently running processes and the total number of
	# processes in the m/n format.  The last column displays the last
	# process ID used.
	my @load = split(/\s+/, $line);
	return $load[0] || 0;
}
719
# version of the core git binary
our $git_version;

# Run "$GIT --version" and store the reported version in $git_version
# ("unknown" if the output is not recognized); counts as one git command.
sub evaluate_git_version {
	our $git_version;

	my $output = qx("$GIT" --version);
	if ($output =~ m/git version (.*)$/) {
		$git_version = $1;
	} else {
		$git_version = "unknown";
	}
	$number_of_git_cmds++;
}
726
# Refuse to serve the request with a 503 error when load checking is
# enabled ($maxload is defined) and the system load is above $maxload.
sub check_loadavg {
	if (defined $maxload) {
		my $current_load = get_loadavg();
		if ($current_load > $maxload) {
			die_error(503, "The load average on the server is too high");
		}
	}
}
732
733 # ======================================================================
734 # input validation and dispatch
735
# Input parameters may come from more than one source (presently the CGI
# query string and PATH_INFO).  They are all gathered in %input_params
# during validation, so that later users (e.g. href()) do not have to care
# where a given parameter came from.

our %input_params = ();

# Input parameters are keyed by their long name.  The table below maps each
# long name to the short key used in the CGI query string; it is kept in
# this direction (name -> CGI key) because href(), the most frequent user,
# needs exactly that.  The list form preserves the order of the entries,
# the hash form is for lookups.
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.

our @cgi_param_mapping = (
	project           => 'p',
	action            => 'a',
	file_name         => 'f',
	file_parent       => 'fp',
	hash              => 'h',
	hash_parent       => 'hp',
	hash_base         => 'hb',
	hash_parent_base  => 'hpb',
	page              => 'pg',
	order             => 'o',
	searchtext        => 's',
	searchtype        => 'st',
	snapshot_format   => 'sf',
	extra_options     => 'opt',
	search_use_regexp => 'sr',
	ctag              => 'by_tag',
	diff_style        => 'ds',
	project_filter    => 'pf',
	# this must be last entry (for manipulation from JavaScript)
	javascript        => 'js',
);
our %cgi_param_mapping = @cgi_param_mapping;
774
# Dispatch table: every action name that is accepted, mapped to the
# subroutine implementing it.  It is also used to validate the action.
our %actions = (
	blame             => \&git_blame,
	blame_incremental => \&git_blame_incremental,
	blame_data        => \&git_blame_data,
	blobdiff          => \&git_blobdiff,
	blobdiff_plain    => \&git_blobdiff_plain,
	blob              => \&git_blob,
	blob_plain        => \&git_blob_plain,
	commitdiff        => \&git_commitdiff,
	commitdiff_plain  => \&git_commitdiff_plain,
	commit            => \&git_commit,
	forks             => \&git_forks,
	heads             => \&git_heads,
	history           => \&git_history,
	log               => \&git_log,
	patch             => \&git_patch,
	patches           => \&git_patches,
	remotes           => \&git_remotes,
	rss               => \&git_rss,
	atom              => \&git_atom,
	search            => \&git_search,
	search_help       => \&git_search_help,
	shortlog          => \&git_shortlog,
	summary           => \&git_summary,
	tag               => \&git_tag,
	tags              => \&git_tags,
	tree              => \&git_tree,
	snapshot          => \&git_snapshot,
	object            => \&git_object,
	# those below don't need $project
	opml              => \&git_opml,
	project_list      => \&git_project_list,
	project_index     => \&git_project_index,
);
810
# Extra options (the 'opt' parameter) that are accepted, each mapped to the
# list of actions that may be given that option.
our %allowed_options = (
	'--no-merges' => [ 'rss', 'atom', 'log', 'shortlog', 'history' ],
);
816
# Fill %input_params from the CGI query parameters, decoding each value
# from UTF-8.  Every parameter is stored as a single value, except for the
# one whose CGI key is 'opt', which may be given several times and is
# therefore stored as an array reference.  Should more multi-valued
# parameters appear, a list of them would be the better approach; for now
# the single exception is special-cased.
sub evaluate_query_params {
	our $cgi;

	foreach my $name (keys %cgi_param_mapping) {
		my $symbol = $cgi_param_mapping{$name};

		if ($symbol eq 'opt') {
			my @values = $cgi->param($symbol);
			$input_params{$name} = [ map { decode_utf8($_) } @values ];
		} else {
			$input_params{$name} = decode_utf8($cgi->param($symbol));
		}
	}
}
832
# Read PATH_INFO and use it to fill in parameters that are still missing
# from %input_params.
#
# Nothing is done when the project was already given in the query string or
# when PATH_INFO is empty.  Otherwise PATH_INFO is taken apart as
#
#   $project[/$action][/[$parent_ref[:$parent_path]..]$ref[:$path]]
#
# and the pieces are stored under 'project', 'action', 'hash' / 'hash_base',
# 'file_name', 'hash_parent' / 'hash_parent_base', 'file_parent' and, for
# snapshot URLs ending in a known format suffix, 'snapshot_format'.
# Values that are already set are never overwritten (apart from 'hash',
# which has the snapshot suffix stripped when that suffix is recognized).
sub evaluate_path_info {
	return if defined $input_params{'project'};
	return if !$path_info;
	$path_info =~ s,^/+,,;
	return if !$path_info;

	# find which part of PATH_INFO is project: drop trailing path
	# components until what is left passes check_head_link()
	my $project = $path_info;
	$project =~ s,/+$,,;
	while ($project && !check_head_link("$projectroot/$project")) {
		$project =~ s,/*[^/]*$,,;
	}
	return unless $project;
	$input_params{'project'} = $project;

	# do not change any parameters if an action is given using the query string
	return if $input_params{'action'};
	$path_info =~ s,^\Q$project\E/*,,;

	# next, check if we have an action
	my $action = $path_info;
	$action =~ s,/.*$,,;
	if (exists $actions{$action}) {
		# quote the action so that it is always matched literally
		$path_info =~ s,^\Q$action\E/*,,;
		$input_params{'action'} = $action;
	}

	# actions that want hash_base instead of hash, but can have no
	# pathname (f) parameter
	my %wants_base = map { $_ => 1 } (
		'tree',
		'history',
	);

	# we want to catch, among others
	# [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
	my ($parentrefname, $parentpathname, $refname, $pathname) =
		($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

	# first, analyze the 'current' part
	if (defined $pathname) {
		# we got "branch:filename" or "branch:dir/"
		# we could use git_get_type(branch:pathname), but:
		# - it needs $git_dir
		# - it does a git() call
		# - the convention of terminating directories with a slash
		#   makes it superfluous
		# - embedding the action in the PATH_INFO would make it even
		#   more superfluous
		$pathname =~ s,^/+,,;
		if (!$pathname || substr($pathname, -1) eq "/") {
			$input_params{'action'} ||= "tree";
			$pathname =~ s,/$,,;
		} else {
			# the default action depends on whether we had parent info
			# or not
			if ($parentrefname) {
				$input_params{'action'} ||= "blobdiff_plain";
			} else {
				$input_params{'action'} ||= "blob_plain";
			}
		}
		$input_params{'hash_base'} ||= $refname;
		$input_params{'file_name'} ||= $pathname;
	} elsif (defined $refname) {
		# we got "branch". In this case we have to choose if we have to
		# set hash or hash_base.
		#
		# Most of the actions without a pathname only want hash to be
		# set, except for the ones listed in %wants_base that want
		# hash_base instead. It should also be noted that hand-crafted
		# links having 'history' as an action and no pathname or hash
		# set will fail, but that happens regardless of PATH_INFO.
		if (defined $parentrefname) {
			# if there is parent let the default be 'shortlog' action
			# (for http://git.example.com/repo.git/A..B links); if there
			# is no parent, dispatch will detect type of object and set
			# action appropriately if required (if action is not set)
			$input_params{'action'} ||= "shortlog";
		}
		if ($input_params{'action'} &&
		    $wants_base{$input_params{'action'}}) {
			$input_params{'hash_base'} ||= $refname;
		} else {
			$input_params{'hash'} ||= $refname;
		}
	}

	# next, handle the 'parent' part, if present
	if (defined $parentrefname) {
		# a missing pathspec defaults to the 'current' filename, allowing e.g.
		# someproject/blobdiff/oldrev..newrev:/filename
		if ($parentpathname) {
			$parentpathname =~ s,^/+,,;
			$parentpathname =~ s,/$,,;
			$input_params{'file_parent'} ||= $parentpathname;
		} else {
			$input_params{'file_parent'} ||= $input_params{'file_name'};
		}
		# we assume that hash_parent_base is wanted if a path was specified,
		# or if the action wants hash_base instead of hash; the action may
		# still be unset here (e.g. for "A.."), so guard the lookup
		if (defined $input_params{'file_parent'} ||
		    (defined $input_params{'action'} &&
		     $wants_base{$input_params{'action'}})) {
			$input_params{'hash_parent_base'} ||= $parentrefname;
		} else {
			$input_params{'hash_parent'} ||= $parentrefname;
		}
	}

	# for the snapshot action, we allow URLs in the form
	# $project/snapshot/$hash.ext
	# where .ext determines the snapshot and gets removed from the
	# passed $refname to provide the $hash.
	#
	# To be able to tell that $refname includes the format extension, we
	# require the following two conditions to be satisfied:
	# - the hash input parameter MUST have been set from the $refname part
	#   of the URL (i.e. they must be equal)
	# - the snapshot format MUST NOT have been defined already (e.g. from
	#   CGI parameter sf)
	# It's also useless to try any matching unless $refname has a dot,
	# so we check for that too
	if (defined $input_params{'action'} &&
		$input_params{'action'} eq 'snapshot' &&
		defined $refname && index($refname, '.') != -1 &&
		defined $input_params{'hash'} &&
		$refname eq $input_params{'hash'} &&
		!defined $input_params{'snapshot_format'}) {
		# We loop over the known snapshot formats, checking for
		# extensions. Allowed extensions are both the defined suffix
		# (which includes the initial dot already) and the snapshot
		# format key itself, with a prepended dot.
		#
		# The loop is left early on the first match, so it iterates
		# over keys() rather than each(): leaving an each() loop early
		# keeps the hash iterator in the middle, and a later each() on
		# the same hash (e.g. for the next request served by the same
		# process) would silently skip entries.
		foreach my $fmt (keys %known_snapshot_formats) {
			my $opt = $known_snapshot_formats{$fmt};
			my $hash = $refname;
			unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
				next;
			}
			my $sfx = $1;
			# a valid suffix was found, so set the snapshot format
			# and reset the hash parameter
			$input_params{'snapshot_format'} = $fmt;
			$input_params{'hash'} = $hash;
			# we also set the format suffix to the one requested
			# in the URL: this way a request for e.g. .tgz returns
			# a .tgz instead of a .tar.gz
			$known_snapshot_formats{$fmt}{'suffix'} = $sfx;
			last;
		}
	}
}
983
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp, $project_filter);

# Copy the collected %input_params into the corresponding package
# variables, validating each one on the way.  An invalid value ends the
# request through die_error() with the status and message given below.
#
# Each variable is assigned _before_ it is validated, and the checks are
# done in a fixed order; both are kept as they were, because die_error()
# runs while the variables assigned so far are already in place.
#
# $search_regexp is derived from $searchtext: the text itself when regexp
# search was requested (after checking that it compiles), otherwise the
# text with all metacharacters quoted.  It is reset on every call, so that
# a request without search text does not see the regexp left behind by an
# earlier request handled by the same process.
sub evaluate_and_validate_params {
	our $action = $input_params{'action'};
	if (defined $action && !validate_action($action)) {
		die_error(400, "Invalid action parameter");
	}

	# parameters which are pathnames
	our $project = $input_params{'project'};
	if (defined $project && !validate_project($project)) {
		# do not leave an invalid project name around for die_error()
		undef $project;
		die_error(404, "No such project");
	}

	our $project_filter = $input_params{'project_filter'};
	if (defined $project_filter && !validate_pathname($project_filter)) {
		die_error(404, "Invalid project_filter parameter");
	}

	our $file_name = $input_params{'file_name'};
	if (defined $file_name && !validate_pathname($file_name)) {
		die_error(400, "Invalid file parameter");
	}

	our $file_parent = $input_params{'file_parent'};
	if (defined $file_parent && !validate_pathname($file_parent)) {
		die_error(400, "Invalid file parent parameter");
	}

	# parameters which are refnames
	our $hash = $input_params{'hash'};
	if (defined $hash && !validate_refname($hash)) {
		die_error(400, "Invalid hash parameter");
	}

	our $hash_parent = $input_params{'hash_parent'};
	if (defined $hash_parent && !validate_refname($hash_parent)) {
		die_error(400, "Invalid hash parent parameter");
	}

	our $hash_base = $input_params{'hash_base'};
	if (defined $hash_base && !validate_refname($hash_base)) {
		die_error(400, "Invalid hash base parameter");
	}

	# 'extra_options' is normally always an array reference (it is only
	# set from CGI, and an unset parameter gives the empty list); fall
	# back to an empty list anyway rather than die on a missing value
	our @extra_options = @{ $input_params{'extra_options'} || [] };
	foreach my $opt (@extra_options) {
		if (not exists $allowed_options{$opt}) {
			die_error(400, "Invalid option parameter");
		}
		# plain string comparison: the action is not meant to be a
		# pattern, and it may be unset when no action was requested
		my $allowed_here = defined($action)
			&& grep { $_ eq $action } @{$allowed_options{$opt}};
		if (not $allowed_here) {
			die_error(400, "Invalid option parameter for this action");
		}
	}

	our $hash_parent_base = $input_params{'hash_parent_base'};
	if (defined $hash_parent_base && !validate_refname($hash_parent_base)) {
		die_error(400, "Invalid hash parent base parameter");
	}

	# other parameters
	our $page = $input_params{'page'};
	if (defined $page && $page =~ m/[^0-9]/) {
		die_error(400, "Invalid page parameter");
	}

	our $searchtype = $input_params{'searchtype'};
	if (defined $searchtype && $searchtype =~ m/[^a-z]/) {
		die_error(400, "Invalid searchtype parameter");
	}

	our $search_use_regexp = $input_params{'search_use_regexp'};

	our $searchtext = $input_params{'searchtext'};
	# always start from scratch, see the note above the subroutine
	our $search_regexp = undef;
	if (defined $searchtext) {
		if (length($searchtext) < 2) {
			die_error(403, "At least two characters are required for search parameter");
		}
		if ($search_use_regexp) {
			$search_regexp = $searchtext;
			# compile once just to find out whether it is valid
			if (!eval { qr/$search_regexp/; 1; }) {
				# strip the " at FILE line N" location from the message
				(my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
				die_error(400, "Invalid search regexp '$search_regexp'",
				          esc_html($error));
			}
		} else {
			$search_regexp = quotemeta $searchtext;
		}
	}
}
1102
# path to the current git repository: "$projectroot/$project".
# Only updated when a project is set; otherwise left as it was.
our $git_dir;
sub evaluate_git_dir {
	our $git_dir;

	if ($project) {
		$git_dir = "$projectroot/$project";
	}
}
1108
our (@snapshot_fmts, $git_avatar);

# Set up the feature-dependent globals:
# - @snapshot_fmts: the value of the 'snapshot' feature, passed through
#   filter_snapshot_fmts()
# - $git_avatar: the avatar provider name from the 'avatar' feature, or
#   the empty string when the name is not a known provider or when the
#   provider's dependencies are not available
sub configure_gitweb_features {
	# list of supported snapshot formats
	our @snapshot_fmts = gitweb_get_feature('snapshot');
	@snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

	our ($git_avatar) = gitweb_get_feature('avatar');
	if ($git_avatar eq 'gravatar') {
		# gravatar needs Digest::MD5
		eval { require Digest::MD5; 1; }
			or $git_avatar = '';
	} elsif ($git_avatar ne 'picon') {
		# picon has no dependencies; anything else is unknown
		$git_avatar = '';
	}
}
1128
# Custom error handler, registered with CGI::Carp::set_message() right
# below: a plain 'die <message>' is reported as Internal Server Error
# through die_error().
sub handle_errors_html {
	my ($msg) = @_; # it is already HTML escaped

	# Replace this handler with a plain message first: should an error
	# happen inside die_error itself, we must not be called again,
	# or we would loop forever.
	set_message("Error occured when inside die_error:\n$msg");

	# The subroutine set via CGI::Carp::set_message is called _after_
	# HTTP headers are already written, so die_error must not write them
	# again, and it must not try to jump out as it does otherwise.
	die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1143
# Run the subroutine registered in %actions for the current $action.
#
# When no action was requested, one is chosen: the object type reported by
# git_get_type() if a hash (or hash_base plus file name) is known,
# 'summary' if only a project is known, and 'project_list' otherwise.
# Unknown actions, and actions that need a project when none is set, end
# the request with an error.
sub dispatch {
	unless (defined $action) {
		if (defined $hash) {
			$action = git_get_type($hash)
				or die_error(404, "Object does not exist");
		} elsif (defined $hash_base && defined $file_name) {
			$action = git_get_type("$hash_base:$file_name")
				or die_error(404, "File or directory does not exist");
		} else {
			$action = defined $project ? 'summary' : 'project_list';
		}
	}

	die_error(400, "Unknown action")
		unless defined($actions{$action});

	# only these three actions can work without a project
	my $needs_project = $action !~ m/^(?:opml|project_list|project_index)$/;
	die_error(400, "Project needed")
		if $needs_project && !$project;

	$actions{$action}->();
}
1168
# Restart the per-request statistics: take a new start time (only if
# timing is in use, i.e. $t0 is defined) and zero the git command counter.
sub reset_timer {
	our ($t0, $number_of_git_cmds);

	if (defined $t0) {
		$t0 = [ gettimeofday() ];
	}
	$number_of_git_cmds = 0;
}
1174
# true while the first request of this process is being handled
our $first_request = 1;

# Handle a single request from start to finish: reset the statistics,
# work out the URLs, (re)read the configuration as needed, check the load,
# collect and validate the parameters, and finally dispatch the action.
sub run_request {
	reset_timer();

	evaluate_uri();

	# configuration and git version are read once per process ...
	if ($first_request) {
		evaluate_gitweb_config();
		evaluate_git_version();
	}
	# ... unless per-request configuration is asked for: either a
	# subroutine to call on every request, or a true value meaning
	# "read the config again" (not needed for the first request, which
	# has just read it)
	if (ref($per_request_config) eq 'CODE') {
		$per_request_config->();
	} elsif ($per_request_config && !$first_request) {
		evaluate_gitweb_config();
	}
	check_loadavg();

	# $projectroot and $projects_list might be set in gitweb config file
	$projects_list = $projectroot
		unless $projects_list;

	evaluate_query_params();
	evaluate_path_info();
	evaluate_and_validate_params();
	evaluate_git_dir();

	configure_gitweb_features();

	dispatch();
}
1205
# Hooks and settings of the request loop in run():
# - $is_last_request is asked after every request whether to stop;
#   by default it always says yes (one request per run)
# - the three hooks, when set, are called before the loop starts and
#   before / after every request
# - $CGI is the class used to create the request object, stored in $cgi
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: requests are created with CGI::Fast, and the
# process keeps serving requests until the counter below runs out.
sub configure_as_fcgi {
	require CGI::Fast;
	our $CGI = 'CGI::Fast';

	# Let each child service a limited number of requests.  The counter is
	# bumped once per finished request and the answer becomes true as soon
	# as it exceeds 100, i.e. after the 101st request.
	my $served = 0;
	our $is_last_request = sub {
		$served += 1;
		return $served > 100;
	};
}
# Decide how to run, from the script name and the command line:
# - a script name ending in '.fcgi' (taken from SCRIPT_NAME,
#   SCRIPT_FILENAME or the file name) selects FastCGI operation
# - '--fastcgi' (also '--fcgi', '-f') does the same
# - '--nproc=N' (also '-n') sets up FCGI::ProcManager with N processes by
#   installing the three request loop hooks; it is silently ignored when
#   that module cannot be loaded
sub evaluate_argv {
	my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
	if ($script_name =~ /\.fcgi$/) {
		configure_as_fcgi();
	}

	return unless (@ARGV);

	# handler for the 'nproc' option; gets the option name and its value
	my $use_proc_manager = sub {
		my ($arg, $val) = @_;
		return unless eval { require FCGI::ProcManager; 1; };
		my $proc_manager = FCGI::ProcManager->new({
			n_processes => $val,
		});
		our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
		our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
		our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
	};

	require Getopt::Long;
	Getopt::Long::GetOptions(
		'fastcgi|fcgi|f' => \&configure_as_fcgi,
		'nproc|n=i'      => $use_proc_manager,
	);
}
1240
# Main loop: set up from the command line, then create request objects of
# class $CGI and handle them one by one, calling the hooks (when set)
# around each request, until no request can be created or
# $is_last_request says to stop.
sub run {
	evaluate_argv();

	$first_request = 1;
	if ($pre_listen_hook) {
		$pre_listen_hook->();
	}

 REQUEST:
	while ($cgi = $CGI->new()) {
		if ($pre_dispatch_hook) {
			$pre_dispatch_hook->();
		}

		run_request();

		if ($post_dispatch_hook) {
			$post_dispatch_hook->();
		}
		$first_request = 0;

		if ($is_last_request->()) {
			last REQUEST;
		}
	}

	# this label must stay; nothing within this subroutine refers to it
 DONE_GITWEB:
	1;
}
1265
run();

# When this code has a caller it is wrapped in a subroutine processing
# requests (e.g. mod_perl with ModPerl::Registry, or PSGI with
# Plack::App::WrapCGI), so hand control back to it.  Otherwise this is a
# pure CGI script that has served its single request and can exit.
return if defined caller;
exit;
1276
1277 ## ======================================================================
1278 ## action links
1279
# Build a link to a gitweb page from named parameters.
#
# Parameters are the long parameter names from %cgi_param_mapping (e.g.
# project, action, hash, file_name), plus these extra options:
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
#
# The project defaults to the current $project.  With path_info URLs in
# use (by the -path_info option, or else by the 'pathinfo' feature) as many
# parameters as possible are put into the path; whatever remains is
# appended as a query string, in the order of @cgi_param_mapping.
# Returns the URL as a string.
sub href {
	my %params = @_;
	# default is to use -absolute url() i.e. $my_uri
	my $href = $params{-full} ? $my_url : $my_uri;

	# implicit -replay, must be first of implicit params
	$params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

	$params{'project'} = $project unless exists $params{'project'};

	if ($params{-replay}) {
		# take over every current input parameter that was not
		# given explicitly
		foreach my $name (keys %cgi_param_mapping) {
			if (!exists $params{$name}) {
				$params{$name} = $input_params{$name};
			}
		}
	}

	my $use_pathinfo = gitweb_check_feature('pathinfo');
	if (defined $params{'project'} &&
	    (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
		# try to put as many parameters as possible in PATH_INFO:
		#   - project name
		#   - action
		#   - hash_parent or hash_parent_base:/file_parent
		#   - hash or hash_base:/filename
		#   - the snapshot_format as an appropriate suffix

		# When the script is the root DirectoryIndex for the domain,
		# $href here would be something like http://gitweb.example.com/
		# Thus, we strip any trailing / from $href, to spare us double
		# slashes in the final URL
		$href =~ s,/$,,;

		# Then add the project name, if present
		$href .= "/".esc_path_info($params{'project'});
		delete $params{'project'};

		# since we destructively absorb parameters, we keep this
		# boolean that remembers if we're handling a snapshot;
		# the action may well be missing, which is not a snapshot
		my $is_snapshot = defined $params{'action'} &&
		                  $params{'action'} eq 'snapshot';

		# Summary just uses the project path URL, any other action is
		# added to the URL
		if (defined $params{'action'}) {
			$href .= "/".esc_path_info($params{'action'})
				unless $params{'action'} eq 'summary';
			delete $params{'action'};
		}

		# Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
		# stripping nonexistent or useless pieces
		$href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
			|| $params{'hash_parent'} || $params{'hash'});
		if (defined $params{'hash_base'}) {
			if (defined $params{'hash_parent_base'}) {
				$href .= esc_path_info($params{'hash_parent_base'});
				# skip the file_parent if it's the same as the file_name
				if (defined $params{'file_parent'}) {
					if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
						delete $params{'file_parent'};
					} elsif ($params{'file_parent'} !~ /\.\./) {
						# a name containing '..' cannot go into the
						# path; it stays behind for the query string
						$href .= ":/".esc_path_info($params{'file_parent'});
						delete $params{'file_parent'};
					}
				}
				$href .= "..";
				delete $params{'hash_parent'};
				delete $params{'hash_parent_base'};
			} elsif (defined $params{'hash_parent'}) {
				$href .= esc_path_info($params{'hash_parent'}). "..";
				delete $params{'hash_parent'};
			}

			$href .= esc_path_info($params{'hash_base'});
			if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
				$href .= ":/".esc_path_info($params{'file_name'});
				delete $params{'file_name'};
			}
			delete $params{'hash'};
			delete $params{'hash_base'};
		} elsif (defined $params{'hash'}) {
			$href .= esc_path_info($params{'hash'});
			delete $params{'hash'};
		}

		# If the action was a snapshot, we can absorb the
		# snapshot_format parameter too
		if ($is_snapshot) {
			my $fmt = $params{'snapshot_format'};
			# snapshot_format should always be defined when href()
			# is called, but just in case some code forgets, we
			# fall back to the default
			$fmt ||= $snapshot_fmts[0];
			$href .= $known_snapshot_formats{$fmt}{'suffix'};
			delete $params{'snapshot_format'};
		}
	}

	# now encode the parameters explicitly
	my @result = ();
	for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
		my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
		if (defined $params{$name}) {
			if (ref($params{$name}) eq "ARRAY") {
				foreach my $par (@{$params{$name}}) {
					push @result, $symbol . "=" . esc_param($par);
				}
			} else {
				push @result, $symbol . "=" . esc_param($params{$name});
			}
		}
	}
	$href .= "?" . join(';', @result) if scalar @result;

	# final transformation: trailing spaces must be escaped (URI-encoded)
	$href =~ s/(\s+)$/CGI::escape($1)/e;

	if ($params{-anchor}) {
		$href .= "#".esc_param($params{-anchor});
	}

	return $href;
}
1409
1410
1411 ## ======================================================================
1412 ## validation, quoting/unquoting and escaping
1413
# Return the given action name if it is a key of %actions, undef otherwise
# (also for a missing or otherwise false argument).
sub validate_action {
	my ($input) = @_;

	return undef unless $input;
	return exists $actions{$input} ? $input : undef;
}
1419
# Return the given project name if it may be shown, undef otherwise.
# A project is acceptable when its name is a valid pathname, it is a
# directory below $projectroot, it passes check_export_ok() and, with
# $strict_export set, it is also found by project_in_list().
sub validate_project {
	my ($input) = @_;
	return undef unless $input;

	my $dir = "$projectroot/$input";

	return undef unless validate_pathname($input);
	return undef unless -d $dir;
	return undef unless check_export_ok($dir);
	return undef if $strict_export && !project_in_list($input);

	return $input;
}
1431
# Return the given pathname if it is acceptable, undef otherwise
# (also for a missing or otherwise false argument).
sub validate_pathname {
	my ($input) = @_;
	return undef unless $input;

	# no '.' or '..' as elements of path, i.e. no '.' nor '..'
	# at the beginning, at the end, and between slashes.
	# the empty alternative also catches doubled slashes, as well
	# as a slash at the very beginning or end
	return undef if $input =~ m!(^|/)(|\.|\.\.)(/|$)!;

	# no null characters
	return undef if $input =~ m!\0!;

	return $input;
}
1447
# Return the given ref name if it is acceptable, undef otherwise
# (also for a missing or otherwise false argument).
sub validate_refname {
	my ($input) = @_;
	return undef unless $input;

	# textual hashes are O.K.
	return $input if $input =~ m/^[0-9a-fA-F]{40}$/;

	# it must be correct pathname
	$input = validate_pathname($input);
	return undef unless $input;

	# restrictions on ref name according to git-check-ref-format
	return undef if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

	return $input;
}
1464
# Decode a sequence of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning.
#
# A string that already has the utf8 flag set, or that decodes as valid
# utf-8, is returned in that form; anything else is decoded using
# $fallback_encoding.  Returns undef for undefined input.
sub to_utf8 {
	my ($octets) = @_;

	return undef unless defined $octets;

	# utf8::decode() works in place and returns false for invalid utf-8
	return $octets if utf8::is_utf8($octets);
	return $octets if utf8::decode($octets);

	return decode($fallback_encoding, $octets, Encode::FB_DEFAULT);
}
1478
# Quote unsafe chars for use in a query parameter, but keep the slash,
# even when it's not correct: quoted slashes look too horrible in
# bookmarks.  Spaces are written as '+'.  Returns undef for undefined input.
sub esc_param {
	my ($param) = @_;

	return undef unless defined $param;

	(my $quoted = $param) =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
	# spaces were left alone above so that they can become '+'
	$quoted =~ tr/ /+/;

	return $quoted;
}
1488
# Quote unsafe chars for use in the path_info part of an URL.  The rules
# differ slightly from esc_param(): path_info doesn't treat '+' as space
# (specially), so both are kept literally, but '?' must be escaped.
# Returns undef for undefined input.
sub esc_path_info {
	my ($path_info) = @_;

	return undef unless defined $path_info;

	(my $quoted = $path_info) =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

	return $quoted;
}
1499
# Quote unsafe chars in a whole URL.  Characters that structure an URL
# (such as ';', '/', '?', ':', '@', '&' and '=') cannot be quoted here;
# spaces are written as '+'.  Returns undef for undefined input.
sub esc_url {
	my ($url) = @_;

	return undef unless defined $url;

	(my $quoted = $url) =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	# spaces were left alone above so that they can become '+'
	$quoted =~ tr/ /+/;

	return $quoted;
}
1508
# Quote unsafe characters in HTML attributes.
# For XHTML conformance escaping '"' to '&quot;' is not enough, so the
# arguments are handed over to esc_html() unchanged.
sub esc_attr {
	my @args = @_;

	return esc_html(@args);
}
1515
# Escape a string for output as HTML text: decode it with to_utf8(),
# escape it with CGI's escapeHTML(), and make control characters other
# than tab visible through quot_cec().
#
# Options (name => value pairs after the string):
#   -nbsp => true   replace every space by '&nbsp;'
#
# Returns undef for undefined input.
sub esc_html {
	my ($str, %opts) = @_;

	return undef unless defined $str;

	my $text = to_utf8($str);
	my $html = $cgi->escapeHTML($text);
	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	# tab is the one control character that is kept as it is
	$html =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;

	return $html;
}
1531
# Quote control characters and escape a filename for HTML output: decode
# it with to_utf8(), escape it with CGI's escapeHTML(), and make every
# control character (tab included) visible through quot_cec().
#
# Options (name => value pairs after the string):
#   -nbsp => true   replace every space by '&nbsp;'
#
# Returns undef for undefined input.
sub esc_path {
	my ($str, %opts) = @_;

	return undef unless defined $str;

	my $text = to_utf8($str);
	my $html = $cgi->escapeHTML($text);
	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$html =~ s|([[:cntrl:]])|quot_cec($1)|eg;

	return $html;
}
1547
# Sanitize for use in XHTML + application/xhtml+xml (valid XML 1.0):
# decode the string with to_utf8() and replace every control character
# except tab, line feed and carriage return by its quot_cec() form.
# Returns undef for undefined input.
sub sanitize {
	my $str = shift;

	return undef unless defined $str;

	$str = to_utf8($str);
	# Test for \t, \n, \r with index() and not with a nested pattern match:
	# a successful inner match resets $1, so the character that was meant
	# to be kept would be replaced by an undefined value instead.
	$str =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
	return $str;
}
1558
# Make control characters "printable", using character escape codes (CEC).
#
# Takes one control character followed by optional name => value options.
# Characters with a well-known escape sequence are shown as that sequence
# (e.g. '\n'); all others as a backslash followed by their two-digit,
# zero-padded hexadecimal code (e.g. '\01', '\7f').
#
# Options:
#   -nohtml => true   return the bare escape code; otherwise it is
#                     wrapped in <span class="cntrl">...</span>
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# %02x, not %2x: codes below 0x10 must be padded with a zero, because
	# a space-padded code would put a blank inside the escape ('\ 1')
	my $chr = ( (exists $es{$cntrl})
	            ? $es{$cntrl}
	            : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1583
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR).
#
# Takes one control character followed by optional name => value options
# and returns a decimal character reference to its control picture.
#
# Options:
#   -nohtml => true   return the bare character reference; otherwise it
#                     is wrapped in <span class="cntrl">...</span>
sub quot_upr {
	my $cntrl = shift;
	my %opts = @_;

	my $code = ord($cntrl);
	# The pictures for 0x00..0x1f are laid out in order from U+2400 on,
	# but the one for DEL (0x7f) is U+2421, not U+2400 + 0x7f.
	my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

	my $chr = sprintf('&#%04d;', $picture);
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1597
# Helper for unquote(): turn the text that followed a backslash into the
# character it stands for.  Up to three octal digits give the character
# with that code, a known escape letter gives its control character, and
# anything else is a quoted ordinary character that is returned as it is.
sub unq {
	my ($seq) = @_;

	# octal char sequence
	return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

	my %es = ( # character escape codes, aka escape sequences
		't' => "\t",   # tab            (HT, TAB)
		'n' => "\n",   # newline        (NL)
		'r' => "\r",   # return         (CR)
		'f' => "\f",   # form feed      (FF)
		'b' => "\b",   # backspace      (BS)
		'a' => "\a",   # alarm (bell)   (BEL)
		'e' => "\e",   # escape         (ESC)
		'v' => "\013", # vertical tab   (VT)
	);

	# C escape sequence (aka character escape code),
	# or else a quoted ordinary character
	return exists $es{$seq} ? $es{$seq} : $seq;
}

# git may return quoted and escaped filenames: a name enclosed in double
# quotes has the quotes removed and its backslash sequences replaced via
# unq(); any other string is returned unchanged.
sub unquote {
	my ($str) = @_;

	# nothing to do unless the whole name is enclosed in double quotes
	return $str unless $str =~ m/^"(.*)"$/;

	my $inner = $1;
	$inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	return $inner;
}
1633
# Escape tabs: convert each tab to the number of spaces that reaches the
# next multiple of 8 characters, working from left to right.
sub untabify {
	my ($line) = @_;

	my $tab_at = index($line, "\t");
	while ($tab_at != -1) {
		# always between 1 and 8 spaces
		my $width = 8 - ($tab_at % 8);
		substr($line, $tab_at, 1, ' ' x $width);
		$tab_at = index($line, "\t");
	}

	return $line;
}
1647
# Return the number of entries of git_get_projects_list() whose 'path'
# equals $project (0, i.e. false, when there is none).
sub project_in_list {
	my ($project) = @_;

	my @projects = git_get_projects_list();
	my $hits = grep { $_->{'path'} eq $project } @projects;

	return $hits;
}
1653
1654 ## ----------------------------------------------------------------------
1655 ## HTML aware string manipulation
1656
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Parameters: $str, $len, $add_len (a false value means 10) and $where,
# which is 'left', 'center' or 'right' (a false value means 'right') and
# tells which part of the string is replaced by the ellipsis.
sub chop_str {
	my ($str, $len, $add_len, $where) = @_;
	$add_len ||= 10;
	$where   ||= 'right';

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# return early if chopping wouldn't make string shorter;
	# the filler is " ... " (length 5) in the middle, and
	# " ..." or "... " (length 4) at either end
	my $filler_len = ($where eq 'center') ? 5 : 4;
	return $str if ($len + $filler_len >= length($str));

	# when chopping in the middle, distribute $len into left and right part
	$len = int($len/2) if ($where eq 'center');

	# regexps: ending and beginning with word part up to $add_len,
	# i.e. allow only $len chars, but don't cut a word if it would
	# fit in $add_len
	my $endre = qr/.{$len}\w{0,$add_len}/;
	my $begre = qr/\w{0,$add_len}.{$len}/;

	if ($where eq 'left') {
		$str =~ m/^(.*?)($begre)$/;
		my ($head, $kept) = ($1, $2);
		# cut only if the cut part is longer than the dots we would add
		$head = " ..." if (length($head) > 4);
		return "$head$kept";
	}

	if ($where eq 'center') {
		$str =~ m/^($endre)(.*)$/;
		my ($left, $rest) = ($1, $2);
		$rest =~ m/^(.*?)($begre)$/;
		my ($mid, $right) = ($1, $2);
		$mid = " ... " if (length($mid) > 5);
		return "$left$mid$right";
	}

	# chop on the right
	$str =~ m/^($endre)(.*)$/;
	my ($body, $tail) = ($1, $2);
	$tail = "... " if (length($tail) > 4);
	return "$body$tail";
}
1716
# Takes the same arguments as chop_str, and returns the HTML-escaped
# result.  If the string did get chopped, the result is also wrapped in
# a <span> whose title attribute holds the full string, with control
# characters replaced by '?'.
sub chop_and_escape_str {
	my @chop_args = @_;

	my $full  = to_utf8($chop_args[0]);
	my $short = chop_str(@chop_args);

	# nothing was chopped, so no title is needed
	return esc_html($short) if ($short eq $full);

	$full =~ s/[[:cntrl:]]/?/g;
	return $cgi->span({-title=>$full}, esc_html($short));
}
1732
# Highlight selected fragments of string, using given CSS class,
# and escape HTML.  It is assumed that fragments do not overlap.
# Regions are passed as list of [ begin, end ] pairs (array references);
# all other trailing arguments are taken as options for esc_html().
#
# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
# '<span class="mark">foo</span>bar'
sub esc_html_hl_regions {
	my ($str, $css_class, @rest) = @_;

	# split the trailing arguments into regions and esc_html() options
	my (@regions, @opt_list);
	for my $arg (@rest) {
		if (ref($arg) eq 'ARRAY') {
			push @regions, $arg;
		} else {
			push @opt_list, $arg;
		}
	}
	my %opts = @opt_list;

	return esc_html($str, %opts) unless @regions;

	my $html   = '';
	my $cursor = 0;   # end of the part of $str that was already output

	for my $region (@regions) {
		my ($begin, $end) = @$region;

		# Don't create empty <span> elements.
		next if $end <= $begin;

		# plain text between previous region and this one
		if ($begin - $cursor > 0) {
			$html .= esc_html(substr($str, $cursor, $begin - $cursor), %opts);
		}

		my $marked = esc_html(substr($str, $begin, $end - $begin), %opts);
		$html .= $cgi->span({-class => $css_class}, $marked);

		$cursor = $end;
	}

	# plain text after the last region
	if ($cursor < length($str)) {
		$html .= esc_html(substr($str, $cursor), %opts);
	}

	return $html;
}
1768
# Return positions of beginning and end of each match of $regexp in
# $str, as a list of [ begin, end ] pairs.  Returns an empty list when
# either argument is undefined or when nothing matches.
sub matchpos_list {
	my ($text, $pattern) = @_;
	return unless (defined $text && defined $pattern);

	my @spans;
	while ($text =~ /$pattern/g) {
		# @- and @+ hold the offsets of the start and end of the match
		my ($from, $to) = ($-[0], $+[0]);
		push @spans, [$from, $to];
	}

	return @spans;
}
1780
# Highlight match (if any), and escape HTML: every match of $regexp in
# $str is marked with the 'match' CSS class.  Without a regexp, or
# without any match, the string is just escaped.
sub esc_html_match_hl {
	my ($str, $regexp) = @_;

	my @spans = defined $regexp ? matchpos_list($str, $regexp) : ();

	return @spans
		? esc_html_hl_regions($str, 'match', @spans)
		: esc_html($str);
}
1791
1792
# Highlight match (if any) of shortened string, and escape HTML.
#
# $str is the full string, $chopped its shortened form (see chop_str).
# Matches are searched for in $str and marked in $chopped; a match that
# reaches into, or lies entirely in, the chopped-off part is shown by
# marking the trailing ellipsis.  When $chopped is undefined this is the
# same as esc_html_match_hl($str, $regexp).
sub esc_html_match_hl_chopped {
	my ($str, $chopped, $regexp) = @_;
	return esc_html_match_hl($str, $regexp) unless defined $chopped;

	my @all = matchpos_list($str, $regexp);
	return esc_html($chopped) unless @all;

	# filter matches so that we mark chopped string
	my $ellipsis = "... "; # see chop_str
	$ellipsis = '' unless ($chopped =~ s/\Q$ellipsis\E$//);

	my $kept_len     = length($chopped);
	my $ellipsis_len = length($ellipsis);
	my $marked_end   = $kept_len + $ellipsis_len;
	my @visible;

	for my $m (@all) {
		my ($from, $to) = @$m;

		if ($from > $kept_len) {
			# match lies in the chopped-off part: mark the ellipsis
			push @visible, [ $kept_len, $marked_end ] if ($ellipsis_len > 0);
			last;
		}
		if ($to > $kept_len) {
			# match runs into the chopped-off part: extend it
			# over the ellipsis
			push @visible, [ $from, $marked_end ];
			last;
		}
		push @visible, $m;
	}

	return esc_html_hl_regions($chopped . $ellipsis, 'match', @visible);
}
1823
1824 ## ----------------------------------------------------------------------
1825 ## functions returning short strings
1826
# CSS class for given age value (in seconds): "noage" when the age is
# undefined, "age0" below two hours, "age1" below two days, and "age2"
# for everything older.
sub age_class {
	my ($age) = @_;

	return "noage" unless defined $age;
	return "age0"  if $age < 60*60*2;
	return "age1"  if $age < 60*60*24*2;
	return "age2";
}
1841
# Convert age in seconds to "nn units ago" string.  The largest unit of
# which the age holds more than two is used; the count is truncated to
# an integer.  An age of two seconds or less gives " right now".
sub age_string {
	my ($age) = @_;

	return int($age/60/60/24/365) . " years ago"
		if $age > 60*60*24*365*2;
	return int($age/60/60/24/(365/12)) . " months ago"
		if $age > 60*60*24*(365/12)*2;
	return int($age/60/60/24/7) . " weeks ago"
		if $age > 60*60*24*7*2;
	return int($age/60/60/24) . " days ago"
		if $age > 60*60*24*2;
	return int($age/60/60) . " hours ago"
		if $age > 60*60*2;
	return int($age/60) . " min ago"
		if $age > 60*2;
	return int($age) . " sec ago"
		if $age > 2;

	return " right now";
}
1873
# File type bits (octal) used next to the S_IF* constants of Fcntl;
# S_IFGITLINK is the one S_ISGITLINK() tests for.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1878
# Test whether numeric file mode $mode has the type of a gitlink, i.e. a
# submodule/subproject, a commit object reference.
sub S_ISGITLINK {
	my ($mode) = @_;

	# keep only the file type bits of the mode
	my $type_bits = $mode & S_IFMT;

	return $type_bits == S_IFGITLINK;
}
1885
# Convert file mode in octal (given as a string of octal digits) to
# symbolic file mode string.  Only the file type and, for regular files,
# the owner's executable bit decide the result.
sub mode_str {
	my ($octal) = @_;
	my $mode = oct $octal;

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
	return 'lrwxrwxrwx' if S_ISLNK($mode);
	return '----------' unless S_ISREG($mode);

	# git cares only about the executable bit
	return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1907
# Convert file mode in octal (given as a string of octal digits) to file
# type string.  An argument that is not made of octal digits only is
# returned unchanged.
sub file_type {
	my ($mode) = @_;

	return $mode if ($mode !~ m/^[0-7]+$/);
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT);
	return "symlink"   if S_ISLNK($mode);
	return "file"      if S_ISREG($mode);
	return "unknown";
}
1930
# Convert file mode in octal (given as a string of octal digits) to file
# type description string.  Unlike file_type() it tells apart regular
# files with the owner's executable bit set ("executable").  An argument
# that is not made of octal digits only is returned unchanged.
sub file_type_long {
	my ($mode) = @_;

	return $mode if ($mode !~ m/^[0-7]+$/);
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT);
	return "symlink"   if S_ISLNK($mode);
	return "unknown"   unless S_ISREG($mode);

	return ($mode & S_IXUSR) ? "executable" : "file";
}
1957
1958
1959 ## ----------------------------------------------------------------------
1960 ## functions returning short HTML fragments, or transforming HTML fragments
1961 ## which don't belong to other sections
1962
# Format line of commit message: escape it for HTML (spaces become
# '&nbsp;') and turn every word of 8 to 40 hexadecimal digits into a
# link to the 'object' action for that hash.
sub format_log_line_html {
	my ($line) = @_;

	my $html = esc_html($line, -nbsp=>1);
	$html =~ s{\b([0-9a-fA-F]{8,40})\b}{
		my $hash_text = $1;
		$cgi->a({-href => href(action=>"object", hash=>$hash_text),
		         -class => "text"}, $hash_text);
	}eg;

	return $html;
}
1975
# format marker of refs pointing to given object
#
# $refs maps object ids to array references of ref names, $id is the
# object to format the markers for.  Returns an HTML fragment,
# ' <span class="refs">...</span>', with one linked <span> per ref, or
# an empty string if no ref points to $id.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
	my ($refs, $id) = @_;
	my $markers = '';

	if (defined $refs->{$id}) {
		# NOTE(review): $ref aliases the elements of @{$refs->{$id}}, so
		# stripping "^{}" below also changes the caller's list
		foreach my $ref (@{$refs->{$id}}) {
			# this code exploits the fact that non-lightweight tags are the
			# only indirect objects, and that they are the only objects for which
			# we want to use tag instead of shortlog as action
			my ($type, $name) = qw();
			my $indirect = ($ref =~ s/\^\{\}$//);
			# e.g. tags/v2.6.11 or heads/next
			if ($ref =~ m!^(.*?)s?/(.*)$!) {
				$type = $1;
				$name = $2;
			} else {
				$type = "ref";
				$name = $ref;
			}

			my $class = $type;
			$class .= " indirect" if $indirect;

			my $dest_action = "shortlog";

			if ($indirect) {
				$dest_action = "tag" unless $action eq "tag";
			} elsif ($action =~ /^(history|(short)?log)$/) {
				$dest_action = $action;
			}

			my $dest = "";
			$dest .= "refs/" unless $ref =~ m!^refs/!;
			$dest .= $ref;

			# The link text is put into the page as it is, so the ref name
			# has to be escaped: it may contain '<', '>' and '&'.
			my $link = $cgi->a({
				-href => href(
					action=>$dest_action,
					hash=>$dest
				)}, esc_html($name));

			$markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
				$link . "</span>";
		}
	}

	if ($markers) {
		return ' <span class="refs">'. $markers . '</span>';
	} else {
		return "";
	}
}
2035
# Format, perhaps shortened and with markers, title line: returns a link
# to $href with the 'list subject' classes, followed by $extra (if any).
# When $short is shorter than $long, the link shows $short and carries
# $long, with control characters replaced by '?', as its title;
# otherwise the link shows $long.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my %attr = (-href => $href, -class => "list subject");
	my $text = $long;

	if (length($short) < length($long)) {
		$long =~ s/[[:cntrl:]]/?/g;
		$attr{-title} = to_utf8($long);
		$text = $short;
	}

	return $cgi->a(\%attr, esc_html($text)) . $extra;
}
2051
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is keyed by the lowercased email and is shared by all avatar
# engines (gravatar_url() and picon_url() below), which are free to use it
# as preferred. Since only one avatar engine is used for any given page,
# there's no risk for cache conflicts.
our %avatar_cache = ();
2059
# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first, and the url is kept in %avatar_cache.
sub picon_url {
	my $email = lc shift;

	return $avatar_cache{$email} if $avatar_cache{$email};

	my ($user, $domain) = split('@', $email);
	my $url = "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
	          "$domain/$user/" .
	          "users+domains+unknown/up/single";
	$avatar_cache{$email} = $url;

	return $url;
}
2073
# Compute the gravatar url for a given email, if it's not in the cache already.
# Gravatar stores only the part of the URL before the size, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
# The email is lowercased first; $size is appended to the cached part.
sub gravatar_url {
	my ($email, $size) = @_;
	$email = lc $email;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"http://www.gravatar.com/avatar/" .
			Digest::MD5::md5_hex($email) . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
2086
# Return the <img> element with an avatar for the given $email, or an
# empty string if no avatar provider is selected by $git_avatar.
#
# Options (name => value pairs after the email):
#   -size       => key of %avatar_size; a false or unknown value means
#                  'default'
#   -pad_before => true to put '&nbsp;' before the image
#   -pad_after  => true to put '&nbsp;' after the image
sub git_get_avatar {
	my ($email, %opts) = @_;
	my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
	my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
	$opts{-size} ||= 'default';
	my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

	# Other providers can be added by extending the chain, defining $url
	# as needed. If no variant puts something in $url, we assume avatars
	# are completely disabled/unavailable.
	my $url = $git_avatar eq 'gravatar' ? gravatar_url($email, $size)
	        : $git_avatar eq 'picon'    ? picon_url($email)
	        :                             "";

	return "" unless $url;

	my $img = join(' ',
		'<img',
		qq{width="$size"},
		'class="avatar"',
		'src="' . esc_url($url) . '"',
		'alt=""',
		'/>');

	return $pre_white . $img . $post_white;
}
2115
# Wrap $displaytext into a link that searches for commits by $author,
# where $searchtype is 'author' or 'committer'.  When the 'search'
# feature is off, $displaytext is returned as it is.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;

	return $displaytext unless gitweb_check_feature('search');

	# verb used in the title of the link
	my %verb_for = (
		'author'    => "authored",
		'committer' => "committed",
	);
	my $performed = exists $verb_for{$searchtype} ? $verb_for{$searchtype} : "";

	my $search_href = href(action=>"search", hash=>$hash,
	                       searchtext=>$author,
	                       searchtype=>$searchtype);

	return $cgi->a({-href => $search_href, class=>"list",
	                title=>"Search for commits $performed by $author"},
	               $displaytext);
}
2138
# Format the author name of the given commit with the given tag:
# returns <$tag class="author">...</$tag> holding the author's avatar
# and name, wrapped by format_search_author().  The author name is
# chopped and escaped according to the other optional parameters
# (see chop_str).
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $name_html = chop_and_escape_str($co->{'author_name'}, @chop_args);
	my $avatar    = git_get_avatar($co->{'author_email'}, -pad_after => 1);
	my $content   = format_search_author($co->{'author_name'}, "author",
	                                     $avatar . $name_html);

	return "<$tag class=\"author\">" . $content . "</$tag>";
}
2152
# Format git diff header line, i.e. "diff --(git|combined|cc) ...".
# The file names of the line are replaced by the escaped names from
# $from and $to, which become links for sides that have an 'href'.
# Returns the line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# escaped file name of one side with optional 'a/' or 'b/' prefix,
	# as a link if that side has an href (it has none when the file
	# was added, respectively deleted)
	my $path_html = sub {
		my ($side, $prefix) = @_;
		my $text = esc_path($side->{'file'});
		$text = $prefix . $text if ($prefix ne '');
		return $text unless $side->{'href'};
		return $cgi->a({-href => $side->{'href'}, -class => "path"}, $text);
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $path_html->($to, '');
	} else {
		# "ordinary" diff
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $path_html->($from, 'a/');
		$line .= ' ';
		$line .= $path_html->($to, 'b/');
	}

	return "<div class=\"diff header\">$line</div>\n";
}
2188
# Format extended diff header line, before patch itself.
# File names of "copy"/"rename" lines and the abbreviated hashes of
# "index" lines become links where $from / $to provide an 'href'; a
# trailing six-digit mode gets its file type description appended.
# Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# match <path>
	if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
		my $from_path = esc_path($from->{'file'});
		$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"}, $from_path);
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
		my $to_path = esc_path($to->{'file'});
		$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"}, $to_path);
	}

	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' . file_type_long($1) . ')</span>';
	}

	# match <hash>; a side without href is shown as seven zeros
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff
		my @parent_links;
		for my $i (0 .. $diffinfo->{'nparents'} - 1) {
			push @parent_links,
				($from->{'href'}[$i]
					? $cgi->a({-href=>$from->{'href'}[$i],
					           -class=>"hash"},
					          substr($diffinfo->{'from_id'}[$i],0,7))
					: '0' x 7);
		}
		my $to_link = $to->{'href'}
			? $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			          substr($diffinfo->{'to_id'},0,7))
			: '0' x 7;

		$line = 'index ' . join(',', @parent_links) . '..' . $to_link;

	# NOTE(review): the two dots of the pattern below are not escaped, so
	# they match any two characters
	} elsif ($line =~ m/^index [0-9a-fA-F]{40}..[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});

		my $from_link = $from->{'href'}
			? $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
			          substr($from_id,0,7))
			: '0' x 7;
		my $to_link = $to->{'href'}
			? $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			          substr($to_id,0,7))
			: '0' x 7;

		$line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2254
# Render the from-file ("--- a/...") and to-file ("+++ b/...") lines of a
# patch header as HTML.
#
# $from_line / $to_line are the raw header lines, $diffinfo is the parsed
# difftree entry, $from and $to hold the 'file' and 'href' of each side and
# @parents lists the parent commits (consulted only for combined diffs).
# An ordinary diff gives one from-file row; a combined diff (merge commit)
# gives one row per parent.  Returns the concatenated HTML of all rows.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my @rows;

        #assert($from_line =~ m/^---/) if DEBUG;
        if ($diffinfo->{'nparents'}) {
                # combined diff (merge commit)
                foreach my $idx (0 .. $diffinfo->{'nparents'} - 1) {
                        # parents without a link are shown as /dev/null
                        my $from_row = '--- /dev/null';
                        if ($from->{'href'}[$idx]) {
                                # "<n>" links to the blobdiff against parent n,
                                # the file name links to the blob in that parent
                                my $diff_link = $cgi->a(
                                        {-href=>href(action=>"blobdiff",
                                                     hash_parent=>$diffinfo->{'from_id'}[$idx],
                                                     hash_parent_base=>$parents[$idx],
                                                     file_parent=>$from->{'file'}[$idx],
                                                     hash=>$diffinfo->{'to_id'},
                                                     hash_base=>$hash,
                                                     file_name=>$to->{'file'}),
                                         -class=>"path",
                                         -title=>"diff" . ($idx+1)},
                                        $idx+1);
                                my $file_link = $cgi->a(
                                        {-href=>$from->{'href'}[$idx], -class=>"path"},
                                        esc_path($from->{'file'}[$idx]));
                                $from_row = '--- ' . $diff_link . '/' . $file_link;
                        }
                        push @rows, qq!<div class="diff from_file">$from_row</div>\n!;
                }

        } else {
                # ordinary (single parent) diff;
                # no extra formatting for "^--- /dev/null"
                my $from_row = $from_line;
                if ($from_row =~ m!^--- "?a/!) {
                        my $name = $from->{'href'}
                                ? $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                          esc_path($from->{'file'}))
                                : esc_path($from->{'file'});
                        $from_row = '--- a/' . $name;
                }
                push @rows, qq!<div class="diff from_file">$from_row</div>\n!;
        }

        #assert($to_line =~ m/^\+\+\+/) if DEBUG;
        # no extra formatting for "^+++ /dev/null"
        my $to_row = $to_line;
        if ($to_row =~ m!^\+\+\+ "?b/!) {
                my $name = $to->{'href'}
                        ? $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                  esc_path($to->{'file'}))
                        : esc_path($to->{'file'});
                $to_row = '+++ b/' . $name;
        }
        push @rows, qq!<div class="diff to_file">$to_row</div>\n!;

        return join('', @rows);
}
2320
# Build the note shown for a patch that the combined diff simplified away:
# a "diff --cc <path>" header followed by a "Simple merge" line.
# The path links to the resulting blob unless is_deleted() reports the
# entry as deleted.  @parents is accepted but not used here.
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $shown_path;
        if (is_deleted($diffinfo)) {
                $shown_path = esc_path($diffinfo->{'to_file'});
        } else {
                $shown_path = $cgi->a({-href => href(action=>"blob",
                                                     hash_base=>$hash,
                                                     hash=>$diffinfo->{'to_id'},
                                                     file_name=>$diffinfo->{'to_file'}),
                                       -class => "path"},
                                      esc_path($diffinfo->{'to_file'}));
        }

        return join('',
                "<div class=\"diff header\">",
                "diff --cc ",
                $shown_path,
                "</div>\n", # class="diff header"
                "<div class=\"diff nodifferences\">",
                "Simple merge",
                "</div>\n"); # class="diff nodifferences"
}
2345
# Return the CSS class name for a line of patch body: "chunk_header",
# "incomplete", "ctx", "add" or "rem", or "" when nothing matches.
#
# The number of leading sign columns is 1 for an ordinary diff.  When both
# $from and $to are given and $from->{'href'} is an array reference
# (combined diff), it is the number of elements of that array.
sub diff_line_class {
        my ($line, $from, $to) = @_;

        my $is_combined = $from && $to && ref($from->{'href'}) eq "ARRAY";
        my $num_sign = $is_combined ? scalar @{$from->{'href'}} : 1;

        return "chunk_header" if $line =~ m/^\@\@{$num_sign} /;
        return "incomplete"   if $line =~ m/^\\/;
        # The context test must come before the add/rem tests; otherwise they
        # would need a more complicated regexp, for example
        # qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
        return "ctx"          if $line =~ m/^ {$num_sign}/;
        return "add"          if $line =~ m/^[+ ]{$num_sign}/;
        return "rem"          if $line =~ m/^[- ]{$num_sign}/;

        # fallback
        return "";
}
2374
# Turn a unified-diff chunk header ("@@ -a,b +c,d @@ section") into HTML.
# Expects $from and $to to be defined and correctly filled, and $line to
# hold such a chunk header.  Each range becomes a link to "#l<start>" in the
# corresponding blob when that side has an 'href'.
sub format_unidiff_chunk_header {
        my ($line, $from, $to) = @_;

        # the line counts (3rd and 6th capture) are not needed for the output
        my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
                $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

        my $from_cell = $from->{'href'}
                ? $cgi->a({-href=>"$from->{'href'}#l$from_start",
                           -class=>"list"}, $from_text)
                : $from_text;
        my $to_cell = $to->{'href'}
                ? $cgi->a({-href=>"$to->{'href'}#l$to_start",
                           -class=>"list"}, $to_text)
                : $to_text;

        return "<span class=\"chunk_info\">" . '@@ ' . $from_cell . ' ' . $to_cell . ' @@' . "</span>" .
               "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2398
# Turn a combined-diff chunk header ("@@@ -a,b -c,d +e,f @@@ section") into
# HTML.  Expects $from and $to to be defined and correctly filled, and $line
# to hold such a chunk header.  Every range but the last belongs to a parent
# and is linked through $from->{'href'}[<n>]; the last one belongs to the
# result and is linked through $to->{'href'}.
sub format_cc_diff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

        # starting line of a range: what follows the sign character, up to an
        # optional ",<count>" (0 if there is nothing after the sign)
        my @range_text  = split(' ', $ranges);
        my @range_start = map {
                my ($start) = (split(',', substr($_, 1)), 0);
                $start;
        } @range_text;

        # the final range describes the "to" side
        my $to_text  = pop @range_text;
        my $to_start = pop @range_start;

        my @cells;
        foreach my $idx (0 .. $#range_text) {
                my $cell = $range_text[$idx];
                if ($from->{'href'}[$idx]) {
                        $cell = $cgi->a({-href=>"$from->{'href'}[$idx]#l$range_start[$idx]",
                                         -class=>"list"}, $range_text[$idx]);
                }
                push @cells, $cell;
        }

        my $to_cell = $to_text;
        if ($to->{'href'}) {
                $to_cell = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                    -class=>"list"}, $to_text);
        }

        return "<span class=\"chunk_info\">" .
               join(' ', $prefix, @cells, $to_cell, $prefix) .
               "</span>" .
               "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2437
# Format one line of patch body (not a diff header line) as an HTML <div>.
# A line passed as a scalar reference is taken to be HTML already and is
# used verbatim; otherwise it is chomped, untabified and either formatted as
# a chunk header (when $from and $to are given) or escaped with esc_html().
# $diff_class, if true, is added to the "diff" CSS class.
sub format_diff_line {
        my ($line, $diff_class, $from, $to) = @_;

        my $html;
        if (ref($line)) {
                $html = $$line;
        } else {
                chomp $line;
                $line = untabify($line);

                my $both_sides = $from && $to;
                if ($both_sides && $line =~ m/^\@{2} /) {
                        $html = format_unidiff_chunk_header($line, $from, $to);
                } elsif ($both_sides && $line =~ m/^\@{3}/) {
                        $html = format_cc_diff_chunk_header($line, $from, $to);
                } else {
                        $html = esc_html($line, -nbsp=>1);
                }
        }

        my $classes = $diff_class ? "diff $diff_class" : "diff";
        return "<div class=\"$classes\">$html</div>\n";
}
2466
# Build the snapshot link(s) for the tree/commit given by $hash, based on
# @snapshot_fmts:
#  - no format:        returns undef
#  - one format:       a single "_snapshot_" link, format name in the tooltip
#  - several formats:  "snapshot (_tbz2_ _zip_)", one link per format
sub format_snapshot_links {
        my ($hash) = @_;
        my @formats = @snapshot_fmts;

        # explicit undef (not an empty list), as before
        return undef unless @formats;

        if (@formats == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                my $fmt = $formats[0];
                return
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                ),
                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                        }, "snapshot");
        }

        # A parenthesized list of links bearing format names.
        # e.g. "snapshot (_tar.gz_ _zip_)"
        my @links;
        foreach my $fmt (@formats) {
                push @links, $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                )
                        }, $known_snapshot_formats{$fmt}{'display'});
        }
        return "snapshot (" . join(' ', @links) . ")";
}
2501
2502 ## ......................................................................
2503 ## functions returning values to be passed, perhaps after some
2504 ## transformation, to other functions; e.g. returning arguments to href()
2505
# Return a hash of parameters to pass to href() for a feed link; the
# description of the link is returned under the '-title' key.
# $format (default 'Atom') is lowercased to form the 'action'.
# Returns nothing when no project is selected, when there is no action, or
# for the tags/heads/forks/tag/search actions.
sub get_feed_info {
        my $format = shift || 'Atom';
        my %res = (action => lc($format));

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branch refs use the 'refs/heads/' prefix (full name) to tell them
        # apart from tag links; $hash_base is consulted before $hash
        my $branch;
        foreach my $ref ($hash_base, $hash) {
                if (defined $ref && $ref =~ m!^refs/heads/(.*)$!) {
                        $branch = $1;
                        last;
                }
        }

        # find log type for feed description (title)
        my $type;
        if (defined $file_name) {
                $type = "history of $file_name" . ($action eq 'tree' ? "/" : "");
                $type .= " on '$branch'" if (defined $branch);
        } else {
                $type = (defined $branch) ? "log of $branch" : 'log';
        }

        @res{'-title', 'hash', 'file_name'} = (
                $type,
                (defined $branch ? "refs/heads/$branch" : undef),
                $file_name,
        );

        return %res;
}
2541
2542 ## ----------------------------------------------------------------------
2543 ## git utility subroutines, invoking git commands
2544
# Return, as a list, the git executable ($GIT) followed by the --git-dir
# option for the current $git_dir.  Each call increments the
# $number_of_git_cmds counter.
sub git_cmd {
        $number_of_git_cmds += 1;
        return ($GIT, "--git-dir=$git_dir");
}
2550
# Quote the given arguments so they can be passed to the shell as one string:
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $word (@_) {
                # close the quote, emit the escaped character, reopen the quote
                (my $escaped = $word) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$escaped'";
        }
        return join(' ', @quoted);
}
2559
# Return what git_get_full_hash() yields for 'HEAD' in the given project.
sub git_get_head_hash {
        my ($project) = @_;
        return git_get_full_hash($project, 'HEAD');
}
2564
# Thin wrapper: passes all arguments unchanged to git_get_hash()
# (no extra rev-parse options are added).
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2568
# Like git_get_full_hash(), but appends the '--short=7' option to the
# arguments handed to git_get_hash().
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2572
# Run "git rev-parse --verify -q [@options] $hash" in the repository
# "$projectroot/$project" and return the first line of its output (chomped),
# or undef when the command cannot be started or prints nothing.
# $git_dir is pointed at the project for the duration of the call and put
# back afterwards, but only if it was defined on entry.
sub git_get_hash {
        my ($project, $hash, @options) = @_;

        my $saved_git_dir = $git_dir;
        $git_dir = "$projectroot/$project";

        # git_cmd() must be called after $git_dir has been switched
        my @rev_parse = (git_cmd(), 'rev-parse',
                         '--verify', '-q', @options, $hash);

        my $resolved;
        if (open my $out, '-|', @rev_parse) {
                $resolved = <$out>;
                chomp $resolved if defined $resolved;
                close $out;
        }

        $git_dir = $saved_git_dir if defined $saved_git_dir;
        return $resolved;
}
2589
# Return the first line printed by "git cat-file -t" for the given object.
# Returns nothing when the command cannot be started or close() on the
# pipe reports failure.
sub git_get_type {
        my ($object) = @_;

        my @cat_file = (git_cmd(), "cat-file", '-t', $object);
        open(my $pipe, "-|", @cat_file) or return;
        my $kind = <$pipe>;
        return unless close $pipe;

        chomp $kind;
        return $kind;
}
2600
# cached repository configuration: %config holds the parsed settings and
# $config_file names the config file they were read from
our %config;
our $config_file = '';
2604
# Add $value under $key in the hash referenced by $hash.
# The first value for a key is stored directly (not as [ <value> ]);
# a second value turns the entry into an anonymous array of both, and
# further values are appended to that array.
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (ref $hash->{$key}) {
                # already multi-valued
                push @{$hash->{$key}}, $value;
        } elsif (exists $hash->{$key}) {
                # second value: promote the plain scalar to a list
                $hash->{$key} = [ $hash->{$key}, $value ];
        } else {
                $hash->{$key} = $value;
        }
}
2618
# Return the configuration of the current repository as a hash, as printed
# by "git config -z -l".  Keys that occur several times get an array
# reference as value (see hash_set_multi); keys without a value map to undef.
#
# $section_regexp, if defined, limits the result to keys of matching
# sections, e.g. 'gitweb'.  Returns nothing if git cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile the section filter once per call.  (The /o modifier used
        # here previously compiled it once per process, so a later call with
        # a different section would have kept filtering on the first one.)
        my $section_re = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        # "git config -z" terminates every entry with NUL
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # key and value are separated by the first newline
                my ($key, $value) = split(/\n/, $keyval, 2);

                next if (defined $section_re && $key !~ $section_re);
                hash_set_multi(\%config, $key, $value);
        }
        close $fh;

        return %config;
}
2641
# Interpret a config value as a boolean.
# True: no value at all, a number greater than 0, 'true' and 'yes'
# (case-insensitive).  Everything else is false; no value is ever an error.
sub config_to_bool {
        my ($val) = @_;

        # section.key (key present without a value)
        return 1 unless defined $val;

        # strip leading and trailing whitespace
        s/^\s+//, s/\s+$// for $val;

        # section.key = 1
        return $val if ($val =~ /^\d+$/ && $val);
        # section.key = true
        return $val =~ /^(?:true|yes)$/i;
}
2657
# Convert a config value to a plain decimal number.
# A trailing 'k', 'm' or 'g' (either case) multiplies the number by
# 1024, 1048576 or 1073741824.  Values that do not end in such a unit are
# returned as they are, with surrounding whitespace removed.
sub config_to_int {
        my ($val) = @_;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        my %multiplier_for = (
                k =>       1024,
                m =>    1048576,
                g => 1073741824,
        );
        if ($val =~ /^([0-9]*)([kmg])$/i) {
                return $1 * $multiplier_for{lc($2)};
        }
        return $val;
}
2677
# Convert a config value to an array reference, if it is not one already:
# a reference is returned unchanged, a defined scalar becomes a one-element
# array and undef becomes an empty array.
sub config_to_multi {
        my ($val) = @_;

        return $val if ref($val);
        return []   unless defined($val);
        return [ $val ];
}
2684
# Return the value of the gitweb.<key> variable from the configuration of
# the current repository ($git_dir).
#
# $key may be given with or without the leading "gitweb."; $type may be
# 'bool' or 'int' (optionally written '--bool' / '--int') to convert the
# value, any other type is ignored.  With 'bool' the result is the string
# 'true' or 'false'.  Returns nothing if $git_dir is undefined, the key is
# empty or contains non-word characters, or the variable is not set.
# The parsed configuration is cached in %config; it is re-read whenever
# $config_file differs from "$git_dir/config".
sub git_get_project_config {
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless ($key);
        # only the subsection (the middle part), if it exists, is case
        # sensitive and is not lowercased by 'git config -z -l'
        if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
                $key = join(".", lc($1), $2, lc($3));
        } else {
                $key = lc($key);
        }
        $key =~ s/^gitweb\.//;
        return if ($key =~ m/\W/);

        # type sanity check
        if (defined $type) {
                $type =~ s/^--//;
                undef $type
                        if ($type ne 'bool' && $type ne 'int');
        }

        # (re)load the config when it was read for another repository
        my $wanted_file = "$git_dir/config";
        unless (defined $config_file && $config_file eq $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $full_key = "gitweb.$key";
        return unless exists $config{$full_key};

        # ensure given type
        return $config{$full_key} unless defined $type;
        if ($type eq 'bool') {
                # backward compatibility: 'git config --bool' returns true/false
                return (config_to_bool($config{$full_key}) ? 'true' : 'false');
        }
        if ($type eq 'int') {
                return config_to_int($config{$full_key});
        }
        return $config{$full_key};
}
2730
# Return the object hash of $path in the tree-ish $base, using the first
# line of "git ls-tree $base -- $path".
#
# If $type is given, the entry must be of that type.  Returns undef when
# $path is empty, nothing is found, the type differs, the ls-tree output
# cannot be parsed or closing the pipe fails.  (An explicit undef is
# returned on purpose, so the result stays a single value in list context.)
# Dies through die_error() if git-ls-tree cannot be started.
sub git_get_hash_by_path {
        my $base = shift;
        my $path = shift || return undef;
        my $type = shift;

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # Capture into lexicals and check that the match succeeded: after a
        # failed match $2 and $3 would still hold whatever an earlier
        # successful match left behind.
        my ($entry_type, $entry_hash) =
                $line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/
                or return undef;

        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2757
# Return the path of the entry with object id $hash in the tree-ish $base,
# searching the output of "git ls-tree -r -t -z $base".
# Used to get the 'from' filename for combined diff (merge commit) for renames.
# Returns nothing if $base or $hash is empty, and undef if git cannot be
# started or no entry has that id.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # "-z" output: entries are NUL-terminated and paths are not quoted
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # \Q..\E: $hash is matched literally, never as a pattern.
                # /s and \z: a path may contain newlines, take all of it.
                if ($line =~ m/(?:[0-9]+) (?:.+) \Q$hash\E\t(.+)\z/s) {
                        close $fd;
                        return $1;
                }
        }
        close $fd;
        return undef;
}
2781
2782 ## ......................................................................
2783 ## git utility functions, directly accessing git repository
2784
# Get the value of a setting either from the file named like the setting in
# the repository ($GIT_DIR/$name; only its first line is used), or, when that
# file cannot be opened, from the gitweb.$name configuration variable.
# Sets the global $git_dir to "$projectroot/$path".
sub git_get_file_or_project_config {
        my ($path, $name) = @_;

        $git_dir = "$projectroot/$path";

        my $fh;
        unless (open $fh, '<', "$git_dir/$name") {
                return git_get_project_config($name);
        }
        my $first_line = <$fh>;
        close $fh;

        chomp $first_line if defined $first_line;
        return $first_line;
}
2801
# Return the 'description' setting of the project at $path
# (see git_get_file_or_project_config).
sub git_get_project_description {
        my ($project_path) = @_;
        return git_get_file_or_project_config($project_path, 'description');
}
2806
# Return the 'category' setting of the project at $path
# (see git_get_file_or_project_config).
sub git_get_project_category {
        my ($project_path) = @_;
        return git_get_file_or_project_config($project_path, 'category');
}
2811
2812
# Return a hash reference mapping the content tags of $project to weights.
# Sets the global $git_dir to "$projectroot/$project".
#
# supported formats (the first one that applies is used):
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if the first line of its contents is a number, use it as tag weight,
#   - otherwise (including an empty file) add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
        my $project = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$project";
        if (opendir my $dh, "$git_dir/ctags") {
                # plain files only; this also drops '.' and '..'
                my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
                foreach my $tagfile (@files) {
                        open my $ct, '<', $tagfile
                                or next;
                        my $val = <$ct>;
                        close $ct;
                        # an empty file yields undef: no chomp, and no
                        # pattern match on an undefined value below
                        chomp $val if defined $val;

                        # tag name is the file name without directories
                        (my $ctag = $tagfile) =~ s#.*/##;
                        if (defined $val && $val =~ /^\d+$/) {
                                $ctags->{$ctag} = $val;
                        } else {
                                $ctags->{$ctag} = 1;
                        }
                }
                closedir $dh;

        } elsif (open my $fh, '<', "$git_dir/ctags") {
                while (my $line = <$fh>) {
                        chomp $line;
                        $ctags->{$line}++ if $line;
                }
                close $fh;

        } else {
                my $taglist = config_to_multi(git_get_project_config('ctag'));
                foreach my $tag (@$taglist) {
                        $ctags->{$tag}++;
                }
        }

        return $ctags;
}
2859
# Return a hash reference whose keys are the content tags ('ctags') found in
# the given projects (array reference of project hashes) and whose values
# are the sums of the weights each tag has over all projects.
sub git_gather_all_ctags {
        my ($projects) = @_;
        my %weight_of;

        for my $proj (@$projects) {
                $weight_of{$_} += $proj->{'ctags'}{$_}
                        for keys %{$proj->{'ctags'}};
        }

        return \%weight_of;
}
2874
# Build the tag cloud data for the given tag => weight hash reference.
# Tags differing only in case are merged and the most heavily weighted
# spelling is displayed.  Returns an HTML::TagCloud object if that module
# can be loaded, otherwise a hash reference mapping each lowercased tag to
# { count => <weight>, ctag => <HTML link> }.  The tag equal to the 'ctag'
# input parameter is wrapped in <span class="match">.
sub git_populate_project_tagcloud {
        my $ctags = shift;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $name (keys %$ctags) {
                my $weight = $ctags->{$name};
                my $entry  = ($ctags_lc{lc $name} ||= {});
                $entry->{count} += $weight;
                if (!$entry->{topcount} || $entry->{topcount} < $weight) {
                        $entry->{topcount} = $weight;
                        $entry->{topname}  = $name;
                }
        }

        my $matched = $input_params{'ctag'};
        # wrap the title of the currently selected tag
        my $mark_match = sub {
                my ($ctag, $title) = @_;
                return $title unless (defined $matched && $matched eq $ctag);
                return qq(<span class="match">$title</span>);
        };

        my $cloud;
        if (eval { require HTML::TagCloud; 1; }) {
                $cloud = HTML::TagCloud->new;
                foreach my $ctag (sort keys %ctags_lc) {
                        # Pad the title with spaces so that the cloud looks
                        # less crammed.
                        my $title = esc_html($ctags_lc{$ctag}->{topname});
                        $title =~ s/ /&nbsp;/g;
                        $title =~ s/^/&nbsp;/g;
                        $title =~ s/$/&nbsp;/g;
                        $title = $mark_match->($ctag, $title);
                        $cloud->add($title, href(project=>undef, ctag=>$ctag),
                                    $ctags_lc{$ctag}->{count});
                }
        } else {
                $cloud = {};
                foreach my $ctag (keys %ctags_lc) {
                        my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
                        $title = $mark_match->($ctag, $title);
                        $cloud->{$ctag}{count} = $ctags_lc{$ctag}->{count};
                        $cloud->{$ctag}{ctag} =
                                $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
                }
        }
        return $cloud;
}
2920
# Return the HTML for a tag cloud built by git_populate_project_tagcloud(),
# limited to $count tags.
# An HTML::TagCloud object renders itself via html_and_css($count); the
# plain hash fallback is rendered as a comma separated list of tag links.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;
        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        } else {
                # Heaviest tags first, so that the $count limit keeps the most
                # used tags (an ascending sort kept the least used ones);
                # ties are ordered by name to make the output stable.
                my @tags = sort {
                        $cloud->{$b}->{'count'} <=> $cloud->{$a}->{'count'}
                                or $a cmp $b
                } keys %$cloud;
                return
                        '<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
                        join (', ', map {
                                $cloud->{$_}->{'ctag'}
                        } splice(@tags, 0, $count)) .
                        '</div>';
        }
}
2935
# Return the URLs of the project at $path: the lines of its
# $GIT_DIR/cloneurl file or, when that file cannot be opened, the values of
# the gitweb.url config variable.  Gives a list in list context and an array
# reference otherwise.  Sets the global $git_dir to "$projectroot/$path".
sub git_get_project_url_list {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $fh;
        unless (open $fh, '<', "$git_dir/cloneurl") {
                # no cloneurl file: fall back to the repository config
                return wantarray ?
                        @{ config_to_multi(git_get_project_config('url')) } :
                           config_to_multi(git_get_project_config('url'));
        }
        chomp(my @urls = <$fh>);
        close $fh;

        return wantarray ? @urls : \@urls;
}
2949
# Return the list of projects as hash references with a 'path' key (and an
# 'owner' key when the projects list file names one).
#
# If $projects_list is a directory it is scanned for repositories that pass
# check_export_ok(); if it is a file, each line holds a URL-encoded path and
# an optional URL-encoded owner.  $filter, if given, limits the result to
# projects whose path begins with "$filter/".  When scanning a directory,
# $paranoid makes the scan start at the top and apply the filter to every
# path found, instead of scanning only the "$filter" subdirectory.
sub git_get_projects_list {
        my $filter = shift || '';
        my $paranoid = shift;
        my @list;

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);
                # when filtering, search only given subdirectory
                if ($filter && !$paranoid) {
                        $dir .= "/$filter";
                        $dir =~ s!/+$!!;
                }

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # don't traverse too deep (Find is super slow on os x)
                                # $project_maxdepth excludes depth of $projectroot
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                my $path = substr($File::Find::name, $pfxlen + 1);
                                # paranoidly only filter here
                                if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
                                        # this is a callback, not a loop body:
                                        # leave it with return, not next
                                        return;
                                }
                                # we check related file in $projectroot
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        if (!defined $path) {
                                next PROJECT;
                        }
                        # if $filter is provided, check if $path begins with $filter
                        if ($filter && $path !~ m!^\Q$filter\E/!) {
                                next PROJECT;
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path
                                };
                                if ($owner) {
                                        $pr->{'owner'} = to_utf8($owner);
                                }
                                push @list, $pr;
                        }
                }
                close $fd;
        }
        return @list;
}
3033
# Split forks off from the list of projects, using a prefix tree of path
# components (written with help of Tree::Trie module; Perl Artistic License,
# GPL compatible).
#
# Takes a reference to the list of projects and returns the list of projects
# that were not recognized as forks.  As a side effect, each project whose
# fork directory exists gets a 'forks' field: a list reference collecting
# the forks found for that project.
sub filter_forks_from_projects_list {
	my ($projects) = @_;

	# prefix tree keyed by directory name; the '' key is the end marker
	# and holds the project that owns this prefix
	my %trie;

	# first pass: register every project that might contain forks
	foreach my $pr (@$projects) {
		# forks of 'repo.git' are in 'repo/' directory
		(my $path = $pr->{'path'}) =~ s/\.git$//;
		next if $path =~ m!/$!;            # non-bare repository, e.g. 'repo/.git'
		next if !$path;                    # '.git' repository: tests, git-instaweb
		next if !-d "$projectroot/$path";  # containing directory does not exist
		$pr->{'forks'} = [];               # there can be 0 or more forks of project

		my @dirs = split('/', $path);
		my $node = \%trie;
		# follow the part of the path that is already in the trie ...
		while (@dirs && exists $node->{$dirs[0]}) {
			my $dir = shift @dirs;
			$node = $node->{$dir};
		}
		# ... and grow the trie with the remaining components
		foreach my $dir (@dirs) {
			$node->{$dir} = {};
			$node = $node->{$dir};
		}
		# end marker; the first project registered for a prefix keeps it
		$node->{''} = $pr unless exists $node->{''};
	}

	# second pass: a project is a fork if a proper prefix of its path
	# carries an end marker (the shortest such prefix wins)
	my @filtered;
 PROJECT:
	foreach my $pr (@$projects) {
		my $node = \%trie;
		foreach my $dir (split('/', $pr->{'path'})) {
			if (exists $node->{''}) {
				# found [shortest] prefix, is a fork - skip it
				push @{$node->{''}{'forks'}}, $pr;
				next PROJECT;
			}
			unless (exists $node->{$dir}) {
				# not in trie, cannot have prefix, not a fork
				push @filtered, $pr;
				next PROJECT;
			}
			# one step down the trie
			$node = $node->{$dir};
		}
		# ran out of path components without hitting an end marker
		push @filtered, $pr;
	}

	return @filtered;
}
3093
# Select projects matching a content tag and/or a search regexp.
#
# Parameters: reference to the list of projects, followed by options
#   tagfilter     => tag that must be among the keys of the project's
#                    'ctags' hash (compared case-insensitively)
#   search_regexp => regexp that must match the project's 'path' or its
#                    'descr_long'
# Returns the list of matching projects; when neither option is set the
# input list is returned as is.
#
# The needed fields are requested from fill_project_list_info here
# ('ctags' for tag filtering, 'path' and 'descr' for searching).
sub search_projects_list {
	my ($projlist, %opts) = @_;
	my $tagfilter = $opts{'tagfilter'};
	my $search_re = $opts{'search_regexp'};

	return @$projlist
		unless ($tagfilter || $search_re);

	# searching projects require filling to be run before it;
	fill_project_list_info($projlist,
	                       $tagfilter ? 'ctags' : (),
	                       $search_re ? ('path', 'descr') : ());

	my $wanted_tag = $tagfilter ? lc($tagfilter) : undef;
	my @projects;
 PROJECT:
	foreach my $pr (@$projlist) {

		if ($tagfilter) {
			next PROJECT unless ref($pr->{'ctags'}) eq 'HASH';
			next PROJECT unless
				grep { lc($_) eq $wanted_tag } keys %{$pr->{'ctags'}};
		}

		if ($search_re) {
			# a project without description is searched as if the
			# description were empty (avoids matching against undef)
			my $descr = defined $pr->{'descr_long'} ? $pr->{'descr_long'} : '';
			next PROJECT unless
				$pr->{'path'} =~ /$search_re/ ||
				$descr =~ /$search_re/;
		}

		push @projects, $pr;
	}

	return @projects;
}
3129
# Cache of project owners taken from the $projects_list file: a hash
# reference mapping project path to owner, undef until the file was read.
our $gitweb_project_owner = undef;

# Fill the $gitweb_project_owner cache from the $projects_list file.
# Does nothing if the cache is already defined.  If $projects_list is not
# a plain file, or cannot be opened, the cache is left as an empty hash.
sub git_get_project_list_from_file {

	return if (defined $gitweb_project_owner);

	$gitweb_project_owner = {};
	# read from file (url-encoded):
	# 'git%2Fgit.git Linus+Torvalds'
	# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
	# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
	return unless (-f $projects_list);

	# do not try to read from a handle that failed to open
	open(my $fd, '<', $projects_list) or return;
	while (my $line = <$fd>) {
		chomp $line;
		my ($pr, $ow) = split ' ', $line;
		# blank line: there is no project path to use as a key
		next unless defined $pr;
		$pr = unescape($pr);
		$ow = unescape($ow);
		$gitweb_project_owner->{$pr} = to_utf8($ow);
	}
	close $fd;
}
3152
# Return the owner of the given project, or undef if no project was given.
# Sources are tried in order: the $gitweb_project_owner cache (loaded on
# first use), the 'owner' project config value, and finally the owner of
# the repository directory.
# Side effect: sets the global $git_dir to the project's directory.
sub git_get_project_owner {
	my ($project) = @_;

	return undef unless $project;
	$git_dir = "$projectroot/$project";

	git_get_project_list_from_file()
		unless defined $gitweb_project_owner;

	my $owner;
	$owner = $gitweb_project_owner->{$project}
		if exists $gitweb_project_owner->{$project};
	$owner = git_get_project_config('owner')
		unless defined $owner;
	$owner = get_file_owner("$git_dir")
		unless defined $owner;

	return $owner;
}
3176
# Find out when the project under $projectroot/$path was last committed to,
# looking at the most recently committed-to ref under refs/heads.
# Returns ($age, age_string($age)) with $age in seconds, (undef, undef)
# if no committer timestamp could be read, and nothing if running or
# closing the git command failed.
# Side effect: sets the global $git_dir.
sub git_get_last_activity {
	my $path = shift;

	$git_dir = "$projectroot/$path";
	open(my $fd, "-|", git_cmd(), 'for-each-ref',
	     '--format=%(committer)',
	     '--sort=-committerdate',
	     '--count=1',
	     'refs/heads')
		or return;
	my $most_recent = <$fd>;
	close $fd or return;

	# the committer line ends in "<epoch> <timezone>"
	my ($timestamp) = defined $most_recent
		? ($most_recent =~ / (\d+) [-+][01]\d\d\d$/)
		: ();
	return (undef, undef) unless defined $timestamp;

	my $age = time - $timestamp;
	return ($age, age_string($age));
}
3197
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote
# URL if it's not defined), and we cannot use 'git remote show' because that
# would try to make a network roundtrip. So the only way to find if that
# particular remote is defined is to walk the list provided by
# 'git remote -v' and stop if and when we find what we want.
#
# Parameter: optional name of the single remote wanted.
# Returns a hash (list context) or hash reference (scalar context) keyed by
# remote name; each value is a hash with a 'heads' entry (undef here) plus
# one entry per "(key)" seen on that remote's lines, holding the URL.
# Returns nothing if the command could not be run or closed cleanly.
sub git_get_remotes_list {
	my $wanted = shift;
	my %remotes = ();

	open my $fd, '-|' , git_cmd(), 'remote', '-v';
	return unless $fd;
	while (my $remote = <$fd>) {
		chomp $remote;
		# cut "\t<url> (<key>)" off the line, leaving the remote name;
		# captures are only taken over when the substitution succeeded,
		# so a malformed line never picks up stale $1/$2
		my ($url, $key);
		if ($remote =~ s!\t(.*?)\s+\((\w+)\)$!!) {
			($url, $key) = ($1, $2);
		}
		next if $wanted and not $remote eq $wanted;

		# explicit undef: "'heads' => ()" would build an odd-length hash
		$remotes{$remote} ||= { 'heads' => undef };
		$remotes{$remote}{$key} = $url if defined $key;
	}
	close $fd or return;
	return wantarray ? %remotes : \%remotes;
}
3222
# Takes a reference to a hash of remotes as first parameter and fills it by
# adding the available remote heads for each of the indicated remotes: the
# 'heads' entry of every remote becomes a list reference of the heads whose
# name starts with "<remote>/".  That prefix is stripped from the 'name'
# field of the matching heads.
sub fill_remote_heads {
	my $remotes = shift;
	my @heads = map { "remotes/$_" } keys %$remotes;
	my @remoteheads = git_get_heads_list(undef, @heads);
	foreach my $remote (keys %$remotes) {
		# \Q..\E: the remote name is literal text, not a pattern
		# (it may contain '.', '+' and other metacharacters)
		$remotes->{$remote}{'heads'} = [ grep {
			$_->{'name'} =~ s!^\Q$remote\E/!!
			} @remoteheads ];
	}
}
3235
# Collect references from 'git show-ref --dereference'.
# Parameter: optional ref type (the part after "refs/", e.g. "heads" or
# "tags"); when given, only refs under "refs/<type>" are requested and kept.
# Returns a reference to a hash mapping object id to a list reference of
# ref names (without the leading "refs/"), or nothing if the command could
# not be run or closed cleanly.
sub git_get_references {
	my $type = shift || "";
	my %refs;
	# 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
	# c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
	open my $fd, "-|", git_cmd(), "show-ref", "--dereference",
		($type ? ("--", "refs/$type") : ()) # use -- <pattern> if $type
		or return;

	while (my $line = <$fd>) {
		chomp $line;
		# $type is matched literally, the same way it is handed to show-ref
		if ($line =~ m!^([0-9a-fA-F]{40})\srefs/(\Q$type\E.*)$!) {
			push @{$refs{$1}}, $2;
		}
	}
	close $fd or return;
	return \%refs;
}
3258
# Ask 'git name-rev --tags' for a tag-based name of the given object.
# Returns the part after "tags/" from the command output, or undef when no
# hash was given, the command printed nothing, or the output has another
# form.  Returns nothing if the command could not be started.
sub git_get_rev_name_tags {
	my $hash = shift || return undef;

	open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
		or return;
	my $name_rev = <$fd>;
	close $fd;

	# no output at all: nothing to match against
	return undef unless defined $name_rev;

	# $hash is literal text here, hence \Q..\E
	if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
		return $1;
	} else {
		# catches also '$hash undefined' output
		return undef;
	}
}
3274
3275 ## ----------------------------------------------------------------------
3276 ## parse to hash functions
3277
# Break an epoch timestamp down into display fields.
#
# Parameters: epoch in seconds, and an optional timezone in "+hhmm" /
# "-hhmm" form (defaults to "-0000").
# Returns a hash with the UTC fields 'hour', 'minute', 'mday', 'day',
# 'month', 'rfc2822', 'mday-time', 'iso-8601', and with the fields
# 'hour_local', 'minute_local', 'tz_local', 'iso-tz' computed for the given
# timezone.  A timezone that is not of the "+hhmm" / "-hhmm" form is
# treated as a zero offset; it is still reported verbatim in 'tz_local'
# and 'iso-tz'.
sub parse_date {
	my $epoch = shift;
	my $tz = shift || "-0000";

	my %date;
	my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
	my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
	$date{'hour'} = $hour;
	$date{'minute'} = $min;
	$date{'mday'} = $mday;
	$date{'day'} = $days[$wday];
	$date{'month'} = $months[$mon];
	$date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
	                     $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
	$date{'mday-time'} = sprintf "%d %s %02d:%02d",
	                     $mday, $months[$mon], $hour ,$min;
	$date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
	                     1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

	# offset from UTC in seconds; stays 0 when $tz cannot be parsed, so
	# that no arithmetic is ever done on undefined captures
	my $tz_offset = 0;
	if (my ($tz_sign, $tz_hour, $tz_min) =
	        ($tz =~ m/^([-+])(\d\d)(\d\d)$/)) {
		$tz_offset = (($tz_hour*60) + $tz_min)*60;
		$tz_offset = -$tz_offset if $tz_sign eq '-';
	}
	my $local = $epoch + $tz_offset;
	($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
	$date{'hour_local'} = $hour;
	$date{'minute_local'} = $min;
	$date{'tz_local'} = $tz;
	$date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
	                          1900+$year, $mon+1, $mday,
	                          $hour, $min, $sec, $tz);
	return %date;
}
3311
# Parse the tag object $tag_id as printed by 'git cat-file tag'.
# Returns a hash with 'id', and, as far as present in the object, 'object',
# 'type', 'name', 'author', 'author_epoch', 'author_tz', 'author_name',
# 'author_email', plus 'comment' (list reference with the remaining lines).
# Returns nothing if the command fails or the object has no 'tag' line.
sub parse_tag {
	my ($tag_id) = @_;

	open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;

	my %tag = ('id' => $tag_id);
	my @comment;
 HEADER:
	while (my $line = <$fd>) {
		chomp $line;
		if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
			$tag{'object'} = $1;
			next HEADER;
		}
		if ($line =~ m/^type (.+)$/) {
			$tag{'type'} = $1;
			next HEADER;
		}
		if ($line =~ m/^tag (.+)$/) {
			$tag{'name'} = $1;
			next HEADER;
		}
		if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
			@tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
			if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				@tag{'author_name', 'author_email'} = ($1, $2);
			} else {
				$tag{'author_name'} = $tag{'author'};
			}
			next HEADER;
		}
		if ($line =~ m/--BEGIN/) {
			# this line is kept as the first line of the comment
			push @comment, $line;
			last HEADER;
		}
		# an empty line ends the header
		last HEADER if $line eq "";
	}
	# everything that is left is taken over unmodified
	push @comment, <$fd>;
	$tag{'comment'} = \@comment;
	close $fd or return;

	return unless defined $tag{'name'};
	return %tag;
}
3352
# Parse one commit record in the form printed by 'git rev-list --header'.
#
# Parameters:
#   $commit_text - the record: a header line starting with the commit id
#                  (optionally followed by parent ids), then the commit
#                  headers, an empty line and the indented message
#   $withparents - when defined, parents are taken from the header line
#                  only; otherwise the 'parent' header lines are added too
# Returns a hash with 'id', 'tree', 'parents' (list reference), 'parent',
# the author / committer fields found ('author', 'author_epoch',
# 'author_tz', 'author_name', 'author_email' and the same for 'committer'),
# 'title', 'title_short', 'comment' (list reference of message lines with
# the four-space indent removed), 'age', 'age_string', 'age_string_date'
# and 'age_string_age'.
# Returns nothing if the record is empty, does not start with an object id,
# or has no 'tree' header.
sub parse_commit_text {
	my ($commit_text, $withparents) = @_;
	my @commit_lines = split '\n', $commit_text;
	my %co;

	pop @commit_lines; # Remove '\0'

	if (! @commit_lines) {
		return;
	}

	my $header = shift @commit_lines;
	if ($header !~ m/^[0-9a-fA-F]{40}/) {
		return;
	}
	($co{'id'}, my @parents) = split ' ', $header;
	# commit headers; the loop stops at the empty line before the message
	while (my $line = shift @commit_lines) {
		last if $line eq "\n";
		if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
			$co{'tree'} = $1;
		} elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
			push @parents, $1;
		} elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
			$co{'author'} = to_utf8($1);
			$co{'author_epoch'} = $2;
			$co{'author_tz'} = $3;
			if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				$co{'author_name'}  = $1;
				$co{'author_email'} = $2;
			} else {
				$co{'author_name'} = $co{'author'};
			}
		} elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
			$co{'committer'} = to_utf8($1);
			$co{'committer_epoch'} = $2;
			$co{'committer_tz'} = $3;
			if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
				$co{'committer_name'}  = $1;
				$co{'committer_email'} = $2;
			} else {
				$co{'committer_name'} = $co{'committer'};
			}
		}
	}
	if (!defined $co{'tree'}) {
		return;
	};
	$co{'parents'} = \@parents;
	$co{'parent'} = $parents[0];

	# the title is the first non-empty line of the message
	foreach my $line (@commit_lines) {
		# work on a copy: the loop variable aliases the element of
		# @commit_lines, and the shortening below must not leak into
		# the message stored in 'comment'
		(my $title = $line) =~ s/^    //;
		next if $title eq "";

		$co{'title'} = chop_str($title, 80, 5);
		# remove leading stuff of merges to make the interesting part visible
		if (length($title) > 50) {
			$title =~ s/^Automatic //;
			$title =~ s/^merge (of|with) /Merge ... /i;
			if (length($title) > 50) {
				$title =~ s/(http|rsync):\/\///;
			}
			if (length($title) > 50) {
				$title =~ s/(master|www|rsync)\.//;
			}
			if (length($title) > 50) {
				$title =~ s/kernel.org:?//;
			}
			if (length($title) > 50) {
				$title =~ s/\/pub\/scm//;
			}
		}
		$co{'title_short'} = chop_str($title, 50, 5);
		last;
	}
	if (! defined $co{'title'} || $co{'title'} eq "") {
		$co{'title'} = $co{'title_short'} = '(no commit message)';
	}
	# remove added spaces
	foreach my $line (@commit_lines) {
		$line =~ s/^    //;
	}
	$co{'comment'} = \@commit_lines;

	my $age = time - $co{'committer_epoch'};
	$co{'age'} = $age;
	$co{'age_string'} = age_string($age);
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
	# older than two weeks: the date is the primary form, the age secondary
	if ($age > 60*60*24*7*2) {
		$co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
		$co{'age_string_age'} = $co{'age_string'};
	} else {
		$co{'age_string_date'} = $co{'age_string'};
		$co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
	}
	return %co;
}
3450
# Parse a single commit, given anything 'git rev-list' accepts as a
# revision.  Returns the hash produced by parse_commit_text (parents taken
# from the rev-list header line), or an empty list if git printed nothing.
# Calls die_error(500, ...) if the command cannot be started.
sub parse_commit {
	my ($commit_id) = @_;
	my %co;

	# rev-list --header separates records with NUL
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "rev-list",
		"--parents",
		"--header",
		"--max-count=1",
		$commit_id,
		"--"
		or die_error(500, "Open git-rev-list failed");
	# read exactly one record, in scalar context: in list context an
	# empty output would vanish from the argument list below and the
	# flag '1' would be taken for the commit text
	my $commit_text = <$fd>;
	%co = parse_commit_text($commit_text, 1)
		if defined $commit_text;
	close $fd;

	return %co;
}
3469
# Parse a series of commits listed by 'git rev-list --header'.
#
# Parameters: starting revision, maximum number of commits (defaults to 1),
# number of commits to skip (defaults to 0), optional file name to limit
# history to, and any extra rev-list arguments.  The global @extra_options
# are passed to rev-list as well.
# Returns the list of parsed commits (hash references, one per record
# read) in list context, a reference to that list in scalar context.
# Calls die_error(500, ...) if the command cannot be started.
sub parse_commits {
	my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

	$maxcount ||= 1;
	$skip ||= 0;

	# records are NUL-terminated
	local $/ = "\0";

	my @cmd = (git_cmd(), "rev-list",
	           "--header",
	           @args,
	           "--max-count=$maxcount",
	           "--skip=$skip",
	           @extra_options,
	           $commit_id,
	           "--");
	push @cmd, $filename if $filename;

	open my $fd, "-|", @cmd
		or die_error(500, "Open git-rev-list failed");
	my @cos;
	while (my $record = <$fd>) {
		push @cos, +{ parse_commit_text($record) };
	}
	close $fd;

	return wantarray ? @cos : \@cos;
}
3497
# Parse one line of git-diff-tree "raw" output into a hash.
# Three forms are recognized:
#  - ordinary diff line: 'from_mode', 'to_mode', 'from_id', 'to_id',
#    'status', 'similarity', 'from_file', 'to_file' (and 'file' unless the
#    status is R or C)
#  - combined diff line (merge): 'nparents', 'from_mode' and 'from_id'
#    (list references, one entry per parent), 'to_mode', 'to_id', 'status'
#    (list reference of status letters), 'to_file'
#  - bare object id: 'commit'
# Any other line gives an empty hash.  Returns the hash in list context,
# a reference to it in scalar context.
sub parse_difftree_raw_line {
	my ($line) = @_;
	my %res;

	# ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
	# ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
	if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
		@res{'from_mode', 'to_mode', 'from_id', 'to_id', 'status', 'similarity'} =
			($1, $2, $3, $4, $5, $6);
		my $files = $7;
		if ($res{'status'} eq 'R' || $res{'status'} eq 'C') {
			# renamed or copied: source and destination, tab-separated
			@res{'from_file', 'to_file'} =
				map { unquote($_) } split("\t", $files);
		} else {
			my $file = unquote($files);
			$res{'file'}      = $file;
			$res{'to_file'}   = $file;
			$res{'from_file'} = $file;
		}
	}
	# '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
	# combined diff (for merge commit)
	elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
		my ($colons, $modes, $ids, $status, $file) = ($1, $2, $3, $4, $5);
		$res{'nparents'} = length($colons);
		# the last mode / id belongs to the result, the others to the parents
		my @modes = split(' ', $modes);
		$res{'to_mode'}   = pop @modes;
		$res{'from_mode'} = \@modes;
		my @ids = split(' ', $ids);
		$res{'to_id'}   = pop @ids;
		$res{'from_id'} = \@ids;
		$res{'status'}  = [ split('', $status) ];
		$res{'to_file'} = unquote($file);
	}
	# 'c512b523472485aef4fff9e57b229d9d243c967f'
	elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
		$res{'commit'} = $1;
	}

	return wantarray ? %res : \%res;
}
3536
# wrapper: return parsed line of git-diff-tree "raw" output.
# The argument is either a raw line, which gets parsed, or a hash reference
# with already parsed (or hand-made) info, which is returned unchanged.
sub parsed_difftree_line {
	my ($line_or_ref) = @_;

	# pre-parsed (or generated by hand)
	return $line_or_ref
		if ref($line_or_ref) eq "HASH";

	return parse_difftree_raw_line($line_or_ref);
}
3549
# Parse one line of git-ls-tree output.
#
# Parameters: the line, followed by options
#   -l => true if the line has a size column ('git ls-tree -l')
#   -z => true if names are not quoted ('git ls-tree -z'); otherwise the
#         name is passed through unquote()
# Returns a hash (list context) or hash reference (scalar context) with
# 'mode', 'type', 'hash', 'name', and with 'size' when -l is given.  If
# the line does not have the expected form, all of these are undef.
sub parse_ls_tree_line {
	my $line = shift;
	my %opts = @_;
	my %res;

	# The match is used in list context and assigned directly, so that a
	# line that does not match gives undef fields rather than whatever
	# $1..$5 still hold from an earlier, unrelated match.
	if ($opts{'-l'}) {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
		@res{'mode', 'type', 'hash', 'size', 'name'} =
			($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s);
	} else {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
		@res{'mode', 'type', 'hash', 'name'} =
			($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s);
	}

	if (!$opts{'-z'} && defined $res{'name'}) {
		$res{'name'} = unquote($res{'name'});
	}

	return wantarray ? %res : \%res;
}
3585
# Fill _two_ hashes, passed by reference as 2nd and 3rd argument, with the
# 'file' name and the 'href' of the "blob" view for the pre-image ($from)
# and the post-image ($to) described by $diffinfo.
# For a combined diff ($diffinfo->{'nparents'} is set) the $from fields are
# list references with one entry per parent, and @parents supplies the
# parent commits; otherwise the global $hash_parent is used.  The $to link
# uses the global $hash.  'href' is left out (or undef, per parent) for a
# file that was added, respectively deleted.
sub parse_from_to_diffinfo {
	my ($diffinfo, $from, $to, @parents) = @_;

	if (!$diffinfo->{'nparents'}) {
		# ordinary (not combined) diff
		$from->{'file'} = $diffinfo->{'from_file'};
		if ($diffinfo->{'status'} eq "A") {
			# new (added) file: there is nothing to link to
			delete $from->{'href'};
		} else {
			$from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
			                       hash=>$diffinfo->{'from_id'},
			                       file_name=>$from->{'file'});
		}
	} else {
		# combined diff
		$from->{'file'} = [];
		$from->{'href'} = [];
		fill_from_file_info($diffinfo, @parents)
			unless exists $diffinfo->{'from_file'};
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			# fall back on the resulting name if this parent has none
			my $file = $diffinfo->{'from_file'}[$i];
			$file = $diffinfo->{'to_file'} unless defined $file;
			$from->{'file'}[$i] = $file;

			# no link for a parent in which the file is new (added)
			$from->{'href'}[$i] = $diffinfo->{'status'}[$i] ne "A"
				? href(action=>"blob",
				       hash_base=>$parents[$i],
				       hash=>$diffinfo->{'from_id'}[$i],
				       file_name=>$from->{'file'}[$i])
				: undef;
		}
	}

	$to->{'file'} = $diffinfo->{'to_file'};
	if (is_deleted($diffinfo)) {
		delete $to->{'href'};
	} else {
		# file exists in result
		$to->{'href'} = href(action=>"blob", hash_base=>$hash,
		                     hash=>$diffinfo->{'to_id'},
		                     file_name=>$to->{'file'});
	}
}
3631
3632 ## ......................................................................
3633 ## parse to array of hashes functions
3634
# List refs of the given classes ('heads' if none are given), most recently
# committed-to first, using 'git for-each-ref'.
#
# Parameters: optional limit (one ref more than the limit is requested),
# followed by ref classes, i.e. the part after "refs/".
# Returns a list (or, in scalar context, a list reference) of hash
# references with 'fullname', 'name' (without the "refs/heads/" or
# "refs/remotes/" prefix), 'id', 'title', 'epoch' and 'age'.
# Returns nothing if the command could not be started.
sub git_get_heads_list {
	my ($limit, @classes) = @_;
	@classes = ('heads') unless @classes;

	my @cmd = (git_cmd(), 'for-each-ref');
	push @cmd, '--count='.($limit+1) if $limit;
	push @cmd,
		'--sort=-committerdate',
		'--format=%(objectname) %(refname) %(subject)%00%(committer)',
		map { "refs/$_" } @classes;
	open my $fd, '-|', @cmd
		or return;

	my @headslist;
	while (my $line = <$fd>) {
		chomp $line;
		# "<id> <refname> <subject>" NUL "<committer> <epoch> <tz>"
		my ($refinfo, $committerinfo) = split(/\0/, $line);
		my ($hash, $name, $title) = split(' ', $refinfo, 3);
		my ($committer, $epoch, $tz) =
			($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

		my %ref_item = ('fullname' => $name);
		$name =~ s!^refs/(?:head|remote)s/!!;
		$ref_item{'name'}  = $name;
		$ref_item{'id'}    = $hash;
		$ref_item{'title'} = $title || '(no commit message)';
		$ref_item{'epoch'} = $epoch;
		$ref_item{'age'}   = $epoch
			? age_string(time - $ref_item{'epoch'})
			: "unknown";

		push @headslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @headslist : \@headslist;
}
3673
# List the refs under refs/tags, most recently created first, using
# 'git for-each-ref'.
#
# Parameter: optional limit (one ref more than the limit is requested).
# Returns a list (or, in scalar context, a list reference) of hash
# references with 'fullname', 'name' (without "refs/tags/"), 'type', 'id',
# 'reftype' and 'refid'; tag objects also get 'subject', and tag and commit
# objects get 'epoch' and 'age'.
# Returns nothing if the command could not be started.
sub git_get_tags_list {
	my ($limit) = @_;

	my @cmd = (git_cmd(), 'for-each-ref');
	push @cmd, '--count='.($limit+1) if $limit;
	push @cmd,
		'--sort=-creatordate',
		'--format=%(objectname) %(objecttype) %(refname) '.
		'%(*objectname) %(*objecttype) %(subject)%00%(creator)',
		'refs/tags';
	open my $fd, '-|', @cmd
		or return;

	my @tagslist;
	while (my $line = <$fd>) {
		chomp $line;
		my ($refinfo, $creatorinfo) = split(/\0/, $line);
		my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
		my ($creator, $epoch, $tz) =
			($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);

		my %ref_item = ('fullname' => $name);
		$name =~ s!^refs/tags/!!;
		$ref_item{'type'} = $type;
		$ref_item{'id'}   = $id;
		$ref_item{'name'} = $name;

		if ($type eq "tag") {
			# tag object: report what the tag refers to
			$ref_item{'subject'} = $title;
			$ref_item{'reftype'} = $reftype;
			$ref_item{'refid'}   = $refid;
		} else {
			# the ref points at the object itself
			$ref_item{'reftype'} = $type;
			$ref_item{'refid'}   = $id;
		}

		if ($type eq "tag" || $type eq "commit") {
			$ref_item{'epoch'} = $epoch;
			$ref_item{'age'}   = $epoch
				? age_string(time - $ref_item{'epoch'})
				: "unknown";
		}

		push @tagslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @tagslist : \@tagslist;
}
3722
3723 ## ----------------------------------------------------------------------
3724 ## filesystem-related functions
3725
# Return the name of the owner of $path: the GECOS field of the owning
# user's passwd entry, cut at the first ',' or ';', converted by to_utf8.
# Returns undef if $path cannot be stat()ed or the user has no passwd
# entry.
sub get_file_owner {
	my $path = shift;

	# element 4 of stat() is the owner's uid; without this check a failed
	# stat would make getpwuid() look up uid 0 instead
	my $st_uid = (stat($path))[4];
	if (!defined $st_uid) {
		return undef;
	}
	# element 6 of the passwd entry is the GECOS field
	my $gcos = (getpwuid($st_uid))[6];
	if (!defined $gcos) {
		return undef;
	}
	my $owner = $gcos;
	$owner =~ s/[,;].*$//;
	return to_utf8($owner);
}
3738
# Print the contents of the file $filename, each line converted by to_utf8.
# The file is expected to exist; if it cannot be opened, nothing is printed.
sub insert_file {
	my $filename = shift;

	# do not read from a handle that failed to open
	open my $fd, '<', $filename
		or return;
	print map { to_utf8($_) } <$fd>;
	close $fd;
}
3747
3748 ## ......................................................................
3749 ## mimetype related functions
3750
# Look up the MIME type for $filename in the mime.types-style file $mimemap
# (lines of the form "<mimetype> <ext> <ext> ...", '#' starts a comment
# line).  The part of $filename after the last '.' is used as extension;
# if an extension is listed more than once, the last entry wins.
# Returns the MIME type, or undef if the map file is not readable, the
# file name has no '.', or the extension is not listed.
sub mimetype_guess_file {
	my $filename = shift;
	my $mimemap = shift;
	-r $mimemap or return undef;

	# list-context match: a name without '.' gives no extension at all,
	# rather than a stale $1 from some earlier match
	my ($ext) = ($filename =~ /\.([^.]*)$/);
	return undef unless defined $ext;

	my %mimemap;
	open(my $mh, '<', $mimemap) or return undef;
	# lexical loop variable: reading into $_ would overwrite the caller's $_
	while (my $line = <$mh>) {
		next if $line =~ m/^#/; # skip comments
		my ($mimetype, @exts) = split(/\s+/, $line);
		foreach my $listed (@exts) {
			$mimemap{$listed} = $mimetype;
		}
	}
	close($mh);

	return $mimemap{$ext};
}
3770
# Guess the MIME type of $filename from its extension.
# The file named by $mimetypes_file is consulted first, if set (a relative
# path is taken relative to the current project's directory), then
# '/etc/mime.types'.  Returns undef if the name contains no '.', or
# whatever the last lookup gave if no type was found.
sub mimetype_guess {
	my ($filename) = @_;
	return undef unless $filename =~ /\./;

	my $mime;
	if ($mimetypes_file) {
		# if it is relative path, it is relative to project
		my $file = ($mimetypes_file !~ m!^/!)
			? "$projectroot/$project/$mimetypes_file"
			: $mimetypes_file;
		$mime = mimetype_guess_file($filename, $file);
	}
	$mime = mimetype_guess_file($filename, '/etc/mime.types')
		unless $mime;
	return $mime;
}
3787
# Determine the MIME type of a blob.
# A true result of mimetype_guess($filename) wins.  Otherwise, without a
# filehandle $default_blob_plain_mimetype is returned; with one, the type is
# chosen from Perl's -T (text file) test and a few image file extensions,
# falling back to 'application/octet-stream'.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $by_name = mimetype_guess($filename);
                return $by_name if $by_name;
        }

        # just in case
        unless ($fd) {
                return $default_blob_plain_mimetype;
        }

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' unless $filename;
        return 'image/png' if $filename =~ m/\.png$/i;
        return 'image/gif' if $filename =~ m/\.gif$/i;
        return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
        return 'application/octet-stream';
}
3814
# Return the content type for a blob: $type if given (true), otherwise
# whatever blob_mimetype() determines.  For 'text/plain' the charset from
# $default_text_plain_charset is appended when that variable is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;
        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);

        return "$type; charset=$default_text_plain_charset";
}
3825
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# $highlight - guessing is skipped (undef is returned) when this is false
# $mimetype  - accepted but not consulted here
# $file_name - path of the file; a trailing '.in' suffix is ignored
#
# The basename is looked up in %highlight_basename first, then its
# extension (text after the last '.') in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # Use the capture only when the match succeeded: after a failed match
        # $1 would still hold a stale value from an earlier regexp.
        my ($ext) = $basename =~ /\.([^.]*)$/
                or return undef;
        # an empty (or otherwise false) extension never selects a syntax
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3842
# run highlighter and return FD of its output,
# or return original FD if no highlighting
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        unless ($highlight && defined $syntax) {
                return $fd;
        }

        # the blob is read again through a "git cat-file | highlighter"
        # shell pipeline, so the handle passed in is closed and reused
        close $fd;
        my $cat_blob = quote_command(git_cmd(), "cat-file", "blob", $hash);
        my $highlighter = quote_command($highlight_bin) .
                " --replace-tabs=8 --fragment --syntax $syntax";
        open $fd, "$cat_blob | $highlighter |"
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3856
3857 ## ======================================================================
3858 ## functions printing HTML: header, footer, error page
3859
# Build the page title from the site name and, as far as they are defined,
# the project filter or the project, action and file name.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (!defined $project) {
                $title .= " - projects in '" . esc_path($project_filter) . "'"
                        if defined $project_filter;
                return $title;
        }

        $title .= " - " . to_utf8($project);
        defined $action
                or return $title;

        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)
        defined $file_name
                or return $title;

        $title .= " - " . esc_path($file_name);
        # make a tree path end with a slash
        $title .= "/"
                if ($action eq "tree" && $file_name !~ m|/$|);

        return $title;
}
3882
# Return the content type to use for HTML pages.
sub get_content_type_html {
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        my $accept = $cgi->http('HTTP_ACCEPT');
        my $wants_xhtml =
                defined $accept &&
                $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
                $cgi->Accept('application/xhtml+xml') != 0;

        return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3896
# Print <link rel="alternate"> elements for the page head.
# With a project: an RSS and an Atom feed link, each followed by its
# "--no-merges" variant.  Without a project: links to the plain-text
# project index and to the OPML list of feeds.
sub print_feed_meta {
        unless (defined $project) {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
                return;
        }

        my %href_params = get_feed_info();
        $href_params{'-title'} = 'log'
                unless exists $href_params{'-title'};

        # one <link> element; the values are interpolated verbatim
        my $link_element = sub {
                my ($title, $url, $mime) = @_;
                return "<link ".
                       "rel=\"alternate\" ".
                       "title=\"$title\" ".
                       "href=\"$url\" ".
                       "type=\"$mime\" ".
                       "/>\n";
        };

        foreach my $format (qw(RSS Atom)) {
                my $type = lc($format);
                my $title = esc_attr("$project - $href_params{'-title'} - $format feed");
                my $mime = "application/$type+xml";

                $href_params{'action'} = $type;

                # full feed first, then the variant without merges
                $href_params{'extra_options'} = undef;
                print $link_element->($title, href(%href_params), $mime);

                $href_params{'extra_options'} = '--no-merges';
                print $link_element->($title . ' (no merges)', href(%href_params), $mime);
        }
}
3942
# Print the <link> elements of the page head: stylesheets, feed links
# (only when $status is '200 OK') and the favicon.
sub print_header_links {
        my $status = shift;

        # a $stylesheet defined in a config file takes the place of the
        # @stylesheets list, providing backwards compatibility; empty
        # entries of the list are skipped
        my @css = defined $stylesheet ? ($stylesheet) : grep { $_ } @stylesheets;
        foreach my $css_url (@css) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($css_url).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n)
                if defined $favicon;
}
3962
# Print a trail of links, each followed by " / ", for the directory
# components given as arguments; every link points to the project list
# filtered by the path accumulated up to that component.
sub print_nav_breadcrumbs_path {
        my @prefix;
        # Iterate over the argument list itself: looping on the truth of each
        # shifted element would cut the trail short at a directory named "0".
        foreach my $part (@_) {
                # skip empty components instead of ending the trail
                next unless defined $part && length $part;
                push @prefix, $part;
                print $cgi->a({-href => href(project => undef,
                                             project_filter => join('/', @prefix),
                                             action => "project_list")},
                              esc_html($part)) . " / ";
        }
}
3974
# Print the breadcrumb navigation: home link, then either the project
# path with the current action (plus the optional -action_extra text),
# or the components of the project filter.
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $extra = $opts{-action_extra};

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";

        if (!defined $project) {
                print_nav_breadcrumbs_path(split '/', $project_filter)
                        if defined $project_filter;
                return;
        }

        my @dirname = split '/', $project;
        my $projectbasename = pop @dirname;
        print_nav_breadcrumbs_path(@dirname);
        print $cgi->a({-href => href(action=>"summary")}, esc_html($projectbasename));

        if (defined $action) {
                # the action name becomes a link only when extra text follows it
                my $action_print = defined $extra
                        ? $cgi->a({-href => href(action=>$action)}, $action)
                        : $action;
                print " / $action_print";
        }
        print " / $extra" if defined $extra;
        print "\n";
}
4000
# Print the search form.  As a side effect an undefined $searchtext is
# set to the empty string.
sub print_search_form {
        $searchtext = "" unless defined $searchtext;

        # search from the hash base, else the current hash, else HEAD
        my $search_hash = defined $hash_base ? $hash_base
                        : defined $hash      ? $hash
                        :                      "HEAD";

        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        $action .= "/".esc_url($project) if $use_pathinfo;

        my $head = $cgi->startform(-method => "get", -action => $action) .
                   "<div class=\"search\">\n";
        # with path_info the project is part of the form action;
        # otherwise it is passed as the hidden 'p' field
        $head .= $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n"
                unless $use_pathinfo;
        $head .= $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
                 $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
                 $cgi->popup_menu(-name => 'st', -default => 'commit',
                                  -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
                 $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
                 " search:\n";

        my $tail = $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n" .
                   "<span title=\"Extended regular expression\">" .
                   $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                  -checked => $search_use_regexp) .
                   "</span>" .
                   "</div>" .
                   $cgi->end_form() . "\n";

        print $head, $tail;
}
4036
# Print the HTTP header (unless the '-no_http_header' option is set) and
# the beginning of the HTML page: document head, optional site header
# file, logo, breadcrumbs and, for a project with the 'search' feature
# enabled, the search form.
#
# Arguments: $status (defaults to "200 OK"), $expires, then options.
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        unless ($opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        my $mod_perl_version = '';
        $mod_perl_version = " $ENV{'MOD_PERL'}" if $ENV{'MOD_PERL'};
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                my $logo_img = $cgi->img({-src => esc_url($logo),
                                          -width => 72, -height => 27,
                                          -alt => "git",
                                          -class => "logo"});
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $logo_img);
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $have_search);
}
4095
# Print the end of the HTML page: footer with feed links, optional timing
# information ('timed' feature), optional site footer file, the JavaScript
# includes and the closing body/html tags.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                print $cgi->a({-href => href(project=>undef, action=>"opml",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                # no feed parameters were returned: mark the links as generic
                $feed_class .= ' generic' unless %href_params;
                $href_params{'-title'} ||= 'log';

                foreach my $format ('RSS', 'Atom') {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      tv_interval($t0, [ gettimeofday() ]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;

        my $incremental_blame = (defined $action && $action eq 'blame_incremental');
        if ($incremental_blame) {
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                # collect the onload handler, then emit it in one go
                my $onload = qq!<script type="text/javascript">\n!.
                             qq!window.onload = function () {\n!;
                $onload .= qq!       fixLinks();\n!
                        if gitweb_check_feature('javascript-actions');
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        $onload .= qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!. # in days
                                   qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }
                $onload .= qq!};\n!.
                           qq!</script>\n!;
                print $onload;
        }

        print "</body>\n" .
              "</html>";
}
4174
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# The error message is HTML-escaped; the detailed description is printed
# as-is.  Further arguments are options passed on to git_header_html();
# unless the '-error_handler' option is set, control is transferred to the
# DONE_GITWEB label after the page has been printed.
#
# A 4xx/5xx code not listed above is sent as the bare numeric status; any
# other value results in a '500 Internal Server Error' HTTP status.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # A code without an entry above must still produce an error status:
        # passing undef on would make git_header_html() fall back to "200 OK".
        my $http_status = $http_responses{$status};
        if (!defined $http_status) {
                $http_status = ($status =~ m/^[45][0-9][0-9]$/)
                        ? "$status"
                        : $http_responses{500};
        }
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4218
4219 ## ----------------------------------------------------------------------
4220 ## functions printing or outputting HTML: navigation
4221
# Print the page navigation bar.
#   $current  - entry printed as plain text instead of as a link
#   $suppress - entry left out of the bar (if true)
#   $head     - hash used for the commit and commitdiff links, and for
#               shortlog and log as well when $current is one of
#               tree, log, shortlog, commit, commitdiff or search
#   $treehead - hash for the tree link; also the '%h' replacement
#   $treebase - hash base for the tree link; also the '%b' replacement
#   $extra    - text printed on the second line (pager or formats)
# Entries configured through the 'actions' feature are inserted after the
# entry they name, with %n, %f, %h, %b and %% expanded in their link.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        my %arg;
        $arg{$_} = { action => $_ } foreach @navs;
        if (defined $head) {
                my @with_head = qw(commit commitdiff);
                push @with_head, qw(shortlog log)
                        if $current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x;
                $arg{$_}{'hash'} = $head foreach @with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        # the feature yields a flat list of (label, link, position) triples
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                # insert the new entry right after the one named by $pos
                @navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
                # expand the placeholders
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @entries = map {
                $_ eq $current
                        ? $_
                        : $cgi->a({-href => ($arg{$_}{_href} || href(%{$arg{$_}}))}, "$_")
        } @navs;

        print "<div class=\"page_nav\">\n" . join(" | ", @entries);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4271
# returns a submenu for the navigation of the refs views (tags, heads,
# remotes) with the current view disabled and the remotes view only
# available if the feature is enabled
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @links;
        foreach my $view (@ref_views) {
                # the current view is shown as plain text, the others as links
                push @links, ($view eq $current)
                        ? $view
                        : $cgi->a({-href => href(action=>$view)}, $view);
        }
        return join " | ", @links;
}
4284
# Return the "first / prev / next" paging navigation, separated by
# " &sdot; ".  "first" and "prev" are links only when $page > 0, "next"
# only when $has_next_link is true.  $action is accepted but not used.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my ($first, $prev, $next) = ("first", "prev", "next");
        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                $prev = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        }
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return join(" &sdot; ", $first, $prev, $next);
}
4310
4311 ## ......................................................................
4312 ## functions printing or outputting HTML: div
4313
# Print a <div class="header"> holding one link to the given action
# (with $hash and $hash_base passed along when true); the link text is
# $title, or $action when $title is false.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = (action => $action);
        $args{'hash'} = $hash if $hash;
        $args{'hash_base'} = $hash_base if $hash_base;

        my $text = $title || $action;
        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $text) .
              "\n</div>\n";
}
4327
# Return a two-cell "metadata_url" table row made of $name and $url;
# both values are inserted as given, without escaping.
sub format_repo_url {
        my ($name, $url) = @_;
        return join('',
                "<tr class=\"metadata_url\">",
                "<td>", $name, "</td>",
                "<td>", $url, "</td>",
                "</tr>\n");
}
4332
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content that follows is handled according to what ref() reports:
# a plain scalar is output as-is, a scalar reference is output after html
# escaping, a 'GLOB' reference or 'IO::Handle' is read and output, and a
# function reference is called with all following parameters as arguments.
sub git_print_section {
        my ($div_args, $header_args);

        my $arg = shift;
        ($div_args, $arg) = ($arg, shift) if ref($arg) eq 'HASH';
        ($header_args, $arg) = ($arg, shift) if ref($arg) eq 'ARRAY';
        my $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        my $kind = ref($content);
        if ($kind eq 'CODE') {
                $content->(@_);
        } elsif ($kind eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($kind eq 'GLOB' || $kind eq 'IO::Handle') {
                print <$content>;
        } elsif (!$kind && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4370
# Return HTML for a timestamp: the 'rfc2822' string of the date hash
# reference $date (wrapped in a span when the 'javascript-timezone'
# feature supplies a class for it), followed by the local time and
# timezone in parentheses.
sub format_timestamp_html {
        my $date = shift;

        my (undef, undef, $datetime_class) =
                gitweb_get_feature('javascript-timezone');
        my $strtime = $datetime_class
                ? qq!<span class="$datetime_class">$date->{'rfc2822'}</span>!
                : $date->{'rfc2822'};

        # local times before 06:00 are marked with the "atnight" class
        my $hhmm = sprintf('%02d:%02d', $date->{'hour_local'}, $date->{'minute_local'});
        $hhmm = qq!<span class="atnight">$hhmm</span>!
                if $date->{'hour_local'} < 6;

        return $strtime . ' (' . $hhmm . ' ' . $date->{'tz_local'} . ')';
}
4391
# Outputs the author name and date in long form
# $co is a commit hash reference; the '-tag' option selects the enclosing
# element (default 'div').
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};
        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $author_link = format_search_author($author, "author", esc_html($author));
        my $when = format_timestamp_html(\%ad);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $author_link .
              " [" . $when . "]" .
              $avatar .
              "</$tag>\n";
}
4406
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for. If the list is empty it defaults to both
# author and committer.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = qw(author committer) if !@people;

        for my $who (@people) {
                my ($name, $email) = @{$co}{"${who}_name", "${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_cell =
                        format_search_author($name, $who, esc_html($name)) . " " .
                        format_search_author($email, $who, esc_html("<" . $email . ">"));
                my $avatar_cell = git_get_avatar($email, -size => 'double');
                my $date_cell = format_timestamp_html(\%wd);

                # two rows per person; the avatar cell spans both
                print "<tr><td>$who</td><td>" . $name_cell .
                      "</td><td rowspan=\"2\">" . $avatar_cell .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" . $date_cell .
                      "</td>" .
                      "</tr>\n";
        }
}
4434
# Print the "page_path" line: a link to the tree root followed by one
# link per directory component of $name and finally its last component.
#   $name - path of the object (may be undef: only the root link is shown)
#   $type - 'blob' links the last component to the blob_plain view,
#           'tree' links it to the tree view; otherwise it is plain text
#   $hb   - hash base used for all generated links
sub git_print_page_path {
        my ($name, $type, $hb) = @_;

        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth, of the prefix so that
                        # a directory named "0" still gets its separator
                        $fullname .= (length $fullname ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # link to the path passed in as $name (which is also used for
                # the title) rather than to the global $file_name
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4472
# Print the lines of a commit message ($log is an array reference and is
# modified: the removed leading lines are shifted off it).
# Options:
#   -remove_title     drop the first line
#   -remove_signoff   do not print signoff-style and "...link: URL" lines
#   -final_empty_line end the output with a single empty line
# Runs of empty lines are collapsed into one.
sub git_print_log {
        my ($log, %opts) = @_;

        # remove title, i.e. first line of log
        shift @$log if $opts{'-remove_title'};
        # remove leading empty lines
        shift @$log while (defined $log->[0] && $log->[0] eq "");

        # print log
        my $skip_blank_line = 0;
        foreach my $line (@$log) {
                if ($line =~ m/^\s*([A-Z][-A-Za-z]*-[Bb]y|C[Cc]): /) {
                        unless ($opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                                $skip_blank_line = 1;
                        }
                        next;
                }

                if (my ($label, $url) = $line =~ m,\s*([a-z]*link): (https?://\S+),i) {
                        unless ($opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($label) . ": " .
                                        "<a href=\"" . esc_html($url) . "\">" . esc_html($url) . "</a>" .
                                        "</span><br/>\n";
                                $skip_blank_line = 1;
                        }
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                my $is_blank = ($line eq "");
                next if ($is_blank && $skip_blank_line);
                $skip_blank_line = $is_blank ? 1 : 0;

                print format_log_line_html($line) . "<br/>\n";
        }

        # end with single empty line
        print "<br/>\n"
                if ($opts{'-final_empty_line'} && !$skip_blank_line);
}
4524
# Return link target (what link points to): the whole output of
# "git cat-file blob" for the given object id.  Returns nothing if the
# command could not be started, or if closing the pipe reports failure.
sub git_get_link_target {
	my ($blob_id) = @_;

	open my $pipe, "-|", git_cmd(), "cat-file", "blob", $blob_id
		or return;
	# slurp everything at once; $/ is restored when the block is left
	my $target = do { local $/ = undef; <$pipe> };
	close $pipe
		or return;

	return $target;
}
4542
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
# $link_target - contents of the symbolic link
# $basedir     - directory containing the link, relative to the top tree;
#                undefined or empty for the top tree itself
#
# Empty path components and '.' are dropped and '..' is resolved; a link
# that would lead above the top directory cannot be normalized.
sub normalize_link_target {
	my ($link_target, $basedir) = @_;

	# absolute symlinks (beginning with '/') cannot be normalized
	return if (substr($link_target, 0, 1) eq '/');

	# normalize link target to path from top (root) tree (dir);
	# compare against '' explicitly, so that a directory called "0"
	# is not mistaken for the top tree
	my $path;
	if (defined $basedir && $basedir ne '') {
		$path = $basedir . '/' . $link_target;
	} else {
		# we are in top (root) tree (dir)
		$path = $link_target;
	}

	# remove //, /./, and /../
	my @path_parts;
	foreach my $part (split('/', $path)) {
		# discard '.' and ''; a plain truth test must not be used here,
		# because it would also discard a path component named "0"
		next if ($part eq '' || $part eq '.');
		# handle '..'
		if ($part eq '..') {
			if (@path_parts) {
				pop @path_parts;
			} else {
				# link leads outside repository (outside top dir)
				return;
			}
		} else {
			push @path_parts, $part;
		}
	}
	$path = join('/', @path_parts);

	return $path;
}
4582
# print tree entry (row of git_tree), but without encompassing <tr> element
#
# $t          - hashref describing the entry; keys read here are 'mode',
#               'type', 'hash', 'name' and (optionally) 'size'
# $basedir    - prefix prepended verbatim to the entry name to form the
#               file_name of links (presumably ends with '/' unless empty;
#               confirm against callers)
# $hash_base  - commit-ish the tree belongs to; when undefined, "history"
#               links are not printed
# $have_blame - true if "blame" link should be printed for blobs
sub git_print_tree_entry {
	my ($t, $basedir, $hash_base, $have_blame) = @_;

	my %base_key = ();
	$base_key{'hash_base'} = $hash_base if defined $hash_base;

	# full name of the entry, used as file_name in all links below
	my $path = "$basedir$t->{'name'}";

	# The format of a table row is: mode list link.  Where mode is
	# the mode of the entry, list is the name of the entry, an href,
	# and link is the action links of the entry.

	print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
	if (exists $t->{'size'}) {
		print "<td class=\"size\">$t->{'size'}</td>\n";
	}
	if ($t->{'type'} eq "blob") {
		print "<td class=\"list\">" .
			$cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
			                       file_name=>$path, %base_key),
			        -class => "list"}, esc_path($t->{'name'}));
		if (S_ISLNK(oct $t->{'mode'})) {
			my $link_target = git_get_link_target($t->{'hash'});
			# compare against '' explicitly: a symlink pointing to
			# a file named "0" has a target that is false in Perl
			if (defined $link_target && $link_target ne '') {
				my $norm_target = normalize_link_target($link_target, $basedir);
				if (defined $norm_target) {
					print " -> " .
					      $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
					                             file_name=>$norm_target),
					               -title => $norm_target}, esc_path($link_target));
				} else {
					# target cannot be expressed relative to top tree
					print " -> " . esc_path($link_target);
				}
			}
		}
		print "</td>\n";
		print "<td class=\"link\">";
		print $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
		                             file_name=>$path, %base_key)},
		              "blob");
		if ($have_blame) {
			print " | " .
			      $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
			                             file_name=>$path, %base_key)},
			              "blame");
		}
		if (defined $hash_base) {
			print " | " .
			      $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
			                             hash=>$t->{'hash'}, file_name=>$path)},
			              "history");
		}
		print " | " .
			$cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
			                       file_name=>$path)},
			        "raw");
		print "</td>\n";

	} elsif ($t->{'type'} eq "tree") {
		print "<td class=\"list\">";
		print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
		                             file_name=>$path,
		                             %base_key)},
		              esc_path($t->{'name'}));
		print "</td>\n";
		print "<td class=\"link\">";
		print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
		                             file_name=>$path,
		                             %base_key)},
		              "tree");
		if (defined $hash_base) {
			print " | " .
			      $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
			                             file_name=>$path)},
			              "history");
		}
		print "</td>\n";
	} else {
		# unknown object: we can only present history for it
		# (this includes 'commit' object, i.e. submodule support)
		print "<td class=\"list\">" .
		      esc_path($t->{'name'}) .
		      "</td>\n";
		print "<td class=\"link\">";
		if (defined $hash_base) {
			print $cgi->a({-href => href(action=>"history",
			                             hash_base=>$hash_base,
			                             file_name=>$path)},
			              "history");
		}
		print "</td>\n";
	}
}
4675
4676 ## ......................................................................
4677 ## functions printing large fragments of HTML
4678
# get pre-image filenames for merge (combined) diff
#
# Stores in $diff->{'from_file'} an array with one slot per parent
# ($diff->{'nparents'} of them).  A slot is filled in, by asking
# git_get_path_by_hash() about the parent commit and the pre-image id,
# only where the status for that parent is 'R' or 'C'; all the other
# slots are left undefined.  Returns $diff itself.
sub fill_from_file_info {
	my ($diff, @parents) = @_;

	my $last = $diff->{'nparents'} - 1;

	# start from scratch, with the array already extended to full size
	$diff->{'from_file'} = [ ];
	$diff->{'from_file'}[$last] = undef;

	foreach my $n (0 .. $last) {
		my $status = $diff->{'status'}[$n];
		next unless ($status eq 'R' || $status eq 'C');

		$diff->{'from_file'}[$n] =
			git_get_path_by_hash($parents[$n], $diff->{'from_id'}[$n]);
	}

	return $diff;
}
4695
# is current raw difftree line of file deletion
#
# $diffinfo - hashref of parsed raw diff format; only 'to_id' is examined
#
# Deletion is recognized by the post-image object id consisting only of
# zeros.  Both the 40 hex digit (SHA-1) and the 64 hex digit (SHA-256)
# forms of the null object id are accepted.
sub is_deleted {
	my $diffinfo = shift;
	my $to_id = $diffinfo->{'to_id'};

	return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4702
# does patch correspond to [previous] difftree raw line
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
#
# True only if both arguments are defined and name the same 'to_file'.
sub is_patch_split {
	my ($diffinfo, $patchinfo) = @_;

	my $both_given = defined($diffinfo) && defined($patchinfo);

	return $both_given
		&& $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4713
4714
# Print list of files changed by a commit as HTML table (class "diff_tree"),
# one row per difftree entry, with links to related views of each file.
#
# $difftree - reference to array of difftree entries; each of them is
#             handed to parsed_difftree_line()
# $hash     - commit the changes lead to; used as hash_base in links
#             to post-image of files
# @parents  - parent commit(s); the first one is used as hash_base in
#             links to pre-image in ordinary diff, and more than one
#             parent marks the table as "combined"
#
# Reads globals $cgi and $action; in 'commitdiff' view rows get a link
# to the anchor ("patchN") of the corresponding patch on the same page.
sub git_difftree_body {
	my ($difftree, $hash, @parents) = @_;
	my ($parent) = $parents[0];
	my $have_blame = gitweb_check_feature('blame');
	print "<div class=\"list_head\">\n";
	if ($#{$difftree} > 10) {
		print(($#{$difftree} + 1) . " files changed:\n");
	}
	print "</div>\n";

	print "<table class=\"" .
	      (@parents > 1 ? "combined " : "") .
	      "diff_tree\">\n";

	# header only for combined diff in 'commitdiff' view
	my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
	if ($has_header) {
		# table header
		print "<thead><tr>\n" .
		       "<th></th><th></th>\n"; # filename, patchN link
		for (my $i = 0; $i < @parents; $i++) {
			my $par = $parents[$i];
			print "<th>" .
			      $cgi->a({-href => href(action=>"commitdiff",
			                             hash=>$hash, hash_parent=>$par),
			               -title => 'commitdiff to parent number ' .
			                          ($i+1) . ': ' . substr($par,0,7)},
			              $i+1) .
			      "&nbsp;</th>\n";
		}
		print "</tr></thead>\n<tbody>\n";
	}

	my $alternate = 1;
	my $patchno = 0;
	# advance patch counter and return link to the anchor of that patch;
	# to be used once per row, and only in 'commitdiff' view
	my $next_patch_link = sub {
		$patchno++;
		return $cgi->a({-href => href(-anchor=>"patch$patchno")},
		               "patch");
	};

	foreach my $line (@{$difftree}) {
		my $diff = parsed_difftree_line($line);

		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;

		if (exists $diff->{'nparents'}) { # combined diff

			fill_from_file_info($diff, @parents)
				unless exists $diff->{'from_file'};

			if (!is_deleted($diff)) {
				# file exists in the result (child) commit
				print "<td>" .
				      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash),
				              -class => "list"}, esc_path($diff->{'to_file'})) .
				      "</td>\n";
			} else {
				print "<td>" .
				      esc_path($diff->{'to_file'}) .
				      "</td>\n";
			}

			if ($action eq 'commitdiff') {
				# link to patch
				print "<td class=\"link\">" .
				      $next_patch_link->() .
				      " | " .
				      "</td>\n";
			}

			# one cell per parent; meanwhile find out whether file has
			# any history (was not added with respect to every parent),
			# and whether it exists in result (was not deleted with
			# respect to every parent)
			my $has_history = 0;
			my $not_deleted = 0;
			for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
				my $hash_parent = $parents[$i];
				my $from_hash = $diff->{'from_id'}[$i];
				my $from_path = $diff->{'from_file'}[$i];
				my $status = $diff->{'status'}[$i];

				$has_history ||= ($status ne 'A');
				$not_deleted ||= ($status ne 'D');

				if ($status eq 'A') {
					print "<td  class=\"link\" align=\"right\"> | </td>\n";
				} elsif ($status eq 'D') {
					# NOTE(review): fill_from_file_info() sets 'from_file'
					# only for renames and copies, so $from_path looks to be
					# undefined here unless 'from_file' was provided by
					# parsed_difftree_line() -- confirm
					print "<td class=\"link\">" .
					      $cgi->a({-href => href(action=>"blob",
					                             hash_base=>$hash,
					                             hash=>$from_hash,
					                             file_name=>$from_path)},
					              "blob" . ($i+1)) .
					      " | </td>\n";
				} else {
					if ($diff->{'to_id'} eq $from_hash) {
						print "<td class=\"link nochange\">";
					} else {
						print "<td class=\"link\">";
					}
					print $cgi->a({-href => href(action=>"blobdiff",
					                             hash=>$diff->{'to_id'},
					                             hash_parent=>$from_hash,
					                             hash_base=>$hash,
					                             hash_parent_base=>$hash_parent,
					                             file_name=>$diff->{'to_file'},
					                             file_parent=>$from_path)},
					              "diff" . ($i+1)) .
					      " | </td>\n";
				}
			}

			print "<td class=\"link\">";
			if ($not_deleted) {
				print $cgi->a({-href => href(action=>"blob",
				                             hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "blob");
				print " | " if ($has_history);
			}
			if ($has_history) {
				print $cgi->a({-href => href(action=>"history",
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "history");
			}
			print "</td>\n";

			print "</tr>\n";
			next; # instead of 'else' clause, to avoid extra indent
		}
		# else ordinary diff

		# mode '000000' denotes missing side (file created or deleted),
		# in which case respective variables are left undefined
		my ($to_mode_oct, $to_mode_str, $to_file_type);
		my ($from_mode_oct, $from_mode_str, $from_file_type);
		if ($diff->{'to_mode'} ne ('0' x 6)) {
			$to_mode_oct = oct $diff->{'to_mode'};
			if (S_ISREG($to_mode_oct)) { # only for regular file
				$to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
			}
			$to_file_type = file_type($diff->{'to_mode'});
		}
		if ($diff->{'from_mode'} ne ('0' x 6)) {
			$from_mode_oct = oct $diff->{'from_mode'};
			if (S_ISREG($from_mode_oct)) { # only for regular file
				$from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
			}
			$from_file_type = file_type($diff->{'from_mode'});
		}

		if ($diff->{'status'} eq "A") { # created
			my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
			$mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
			$mode_chng   .= "]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $next_patch_link->() .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			              "blob");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "D") { # deleted
			# deleted file exists only in parent, hence hash_base=>$parent
			my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'}),
			               -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $next_patch_link->() .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
			my $mode_chnge = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				$mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
				if ($from_file_type ne $to_file_type) {
					$mode_chnge .= " from $from_file_type to $to_file_type";
				}
				if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
					if ($from_mode_str && $to_mode_str) {
						$mode_chnge .= " mode: $from_mode_str->$to_mode_str";
					} elsif ($to_mode_str) {
						$mode_chnge .= " mode: $to_mode_str";
					}
				}
				$mode_chnge .= "]</span>\n";
			}
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chnge</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $next_patch_link->() .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only mode changed)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "diff") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			               "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
			my %status_name = ('R' => 'moved', 'C' => 'copied');
			my $nstatus = $status_name{$diff->{'status'}};
			my $mode_chng = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				# mode also for directories, so we cannot use $to_mode_str
				$mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
			}
			print "<td>" .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
			                             hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
			              -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
			      "<td><span class=\"file_status $nstatus\">[$nstatus from " .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
			                             hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
			              -class => "list"}, esc_path($diff->{'from_file'})) .
			      " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
			      "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $next_patch_link->() .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only pure rename or copy)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
				              "diff") .
				      " | ";
			}
			# post-image (to_id, to_file) belongs to $hash, not to $parent:
			# after rename or copy there might be no 'to_file' in parent,
			# so a link based on hash_base and file_name would be broken
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'to_file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'to_file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                            file_name=>$diff->{'to_file'})},
			              "history");
			print "</td>\n";

		} # we should not encounter Unmerged (U) or Unknown (X) status
		print "</tr>\n";
	}
	print "</tbody>" if $has_header;
	print "</table>\n";
}
5022
# Print context lines and then rem/add lines in a side-by-side manner.
#
# $ctx, $rem, $add - references to arrays of already formatted context,
#                    removed and added lines, respectively
#
# Context lines (if any) are printed twice, in "old" and in "new" column.
# What follows is a single block: "chg" with both columns if there are
# both removed and added lines, "add" if there are only added lines, and
# "rem" otherwise (that is, also when there are no lines to print).
sub print_sidebyside_diff_lines {
	my ($ctx, $rem, $add) = @_;

	# context block goes before add/rem block
	if (@$ctx) {
		my $context = join('', @$ctx);
		print '<div class="chunk_block ctx">' .
		      '<div class="old">' . $context . '</div>' .
		      '<div class="new">' . $context . '</div>' .
		      '</div>';
	}

	if (@$add && @$rem) {
		# change: removed lines on the left, added lines on the right
		print '<div class="chunk_block chg">' .
		      '<div class="old">' . join('', @$rem) . '</div>' .
		      '<div class="new">' . join('', @$add) . '</div>' .
		      '</div>';
	} elsif (@$add) {
		# pure addition
		print '<div class="chunk_block add">' .
		      '<div class="new">' . join('', @$add) . '</div>' .
		      '</div>';
	} else {
		# pure removal
		print '<div class="chunk_block rem">' .
		      '<div class="old">' . join('', @$rem) . '</div>' .
		      '</div>';
	}
}
5068
# Print context lines and then rem/add lines in inline manner, i.e. simply
# one group after another: context first, then removed, then added lines.
# All three arguments are references to arrays of lines.
sub print_inline_diff_lines {
	my ($ctx, $rem, $add) = @_;

	print map { @$_ } ($ctx, $rem, $add);
}
5075
# Format removed and added line, mark changed part and HTML-format them.
# Implementation is based on contrib/diff-highlight
#
# $rem, $add   - removed and added line of diff, each still beginning
#                with one +/- column per parent
# $num_parents - number of those leading columns; they are never marked
#
# Returns formatted removed line followed by formatted added line.
sub format_rem_add_lines_pair {
	my ($rem, $add, $num_parents) = @_;

	# We need to untabify lines before split()'ing them;
	# otherwise offsets would be invalid.
	chomp $rem;
	chomp $add;
	$rem = untabify($rem);
	$add = untabify($add);

	my @rem_chars = split(//, $rem);
	my @add_chars = split(//, $add);
	my $limit = (@rem_chars < @add_chars) ? scalar(@rem_chars) : scalar(@add_chars);

	# Length of common prefix; leading +/- characters
	# (one for each parent) are counted in without being compared.
	my $prefix_len = $num_parents;
	my $prefix_has_nonspace;
	for (; $prefix_len < $limit; $prefix_len++) {
		my $char = $rem_chars[$prefix_len];
		last if ($char ne $add_chars[$prefix_len]);

		$prefix_has_nonspace = 1 if ($char !~ /\s/);
	}

	# Length of common suffix, which must not overlap with prefix.
	my $suffix_len = 0;
	my $suffix_has_nonspace;
	for (; $prefix_len + $suffix_len < $limit; $suffix_len++) {
		my $char = $rem_chars[-1 - $suffix_len];
		last if ($char ne $add_chars[-1 - $suffix_len]);

		$suffix_has_nonspace = 1 if ($char !~ /\s/);
	}

	# Mark lines that are different from each other, but have some common
	# part that isn't whitespace.  If lines are completely different, don't
	# mark them because that would make output unreadable, especially if
	# diff consists of multiple lines.
	my ($esc_rem, $esc_add);
	if ($prefix_has_nonspace || $suffix_has_nonspace) {
		# changed part is what remains between common prefix and suffix
		my $rem_end = @rem_chars - $suffix_len;
		my $add_end = @add_chars - $suffix_len;
		$esc_rem = esc_html_hl_regions($rem, 'marked',
			[$prefix_len, $rem_end], -nbsp=>1);
		$esc_add = esc_html_hl_regions($add, 'marked',
			[$prefix_len, $add_end], -nbsp=>1);
	} else {
		$esc_rem = esc_html($rem, -nbsp=>1);
		$esc_add = esc_html($add, -nbsp=>1);
	}

	return format_diff_line(\$esc_rem, 'rem'),
	       format_diff_line(\$esc_add, 'add');
}
5127
# HTML-format the context, removed and added lines of one diff block.
#
# $ctx, $rem and $add are array references; $num_parents is the number of
# parents of the diff (more than one means a combined diff).  Returns
# three array references, in the order (context, removed, added).
#
# When every removed line has a corresponding added line, the lines are
# formatted pairwise with format_rem_add_lines_pair() so that the changed
# part gets marked; otherwise each line is formatted on its own.
sub format_ctx_rem_add_lines {
        my ($ctx, $rem, $add, $num_parents) = @_;
        my $is_combined = ($num_parents > 1);

        # Pairwise highlighting needs as many added as removed lines.
        my $can_highlight = (@$add > 0 && @$add == @$rem) ? 1 : 0;

        # In a combined diff, highlight only if each rem/add pair is a
        # change against the same version, e.g.
        #
        #    - a
        #   -  b
        #    + c
        #   +  d
        #
        # Otherwise the highlighting would be confusing.
        if ($can_highlight && $is_combined) {
                foreach my $i (0 .. $#$add) {
                        my $prefix_rem = substr($rem->[$i], 0, $num_parents);
                        my $prefix_add = substr($add->[$i], 0, $num_parents);

                        # a removal marker must sit where the addition marker does
                        $prefix_rem =~ s/-/+/g;
                        next if ($prefix_rem eq $prefix_add);

                        $can_highlight = 0;
                        last;
                }
        }

        my (@new_rem, @new_add);
        if ($can_highlight) {
                foreach my $i (0 .. $#$add) {
                        my ($line_rem, $line_add) = format_rem_add_lines_pair(
                                $rem->[$i], $add->[$i], $num_parents);
                        push @new_rem, $line_rem;
                        push @new_add, $line_add;
                }
        } else {
                @new_rem = map { format_diff_line($_, 'rem') } @$rem;
                @new_add = map { format_diff_line($_, 'add') } @$add;
        }

        my @new_ctx = map { format_diff_line($_, 'ctx') } @$ctx;

        return (\@new_ctx, \@new_rem, \@new_add);
}
5179
# Format and print context lines followed by removed/added lines.
#
# The lines are first HTML-formatted by format_ctx_rem_add_lines().  They
# are printed side by side only when $diff_style is 'sidebyside' and the
# diff is not a combined one ($num_parents <= 1); the default 'inline'
# style, unknown styles and combined diffs are all printed inline.
sub print_diff_lines {
        my ($ctx, $rem, $add, $diff_style, $num_parents) = @_;
        my $is_combined = $num_parents > 1;

        my @formatted = format_ctx_rem_add_lines($ctx, $rem, $add,
                $num_parents);

        return print_sidebyside_diff_lines(@formatted)
                if ($diff_style eq 'sidebyside' && !$is_combined);

        return print_inline_diff_lines(@formatted);
}
5195
# Print one chunk of a diff.
#
# @chunk is a list of [ $class, $line ] pairs.  Chunk header lines are
# printed immediately; 'ctx', 'rem' and 'add' lines are collected and
# handed to print_diff_lines() block by block, so that a run of removed
# lines and the run of added lines that follows it are printed together.
# $from and $to are passed through to format_diff_line() for the header.
sub print_diff_chunk {
        my ($diff_style, $num_parents, $from, $to, @chunk) = @_;

        return unless @chunk;

        # An incomplete last line might be among removed or added lines,
        # or both, or among context lines: it takes the class of the line
        # right before it.
        foreach my $i (1 .. $#chunk) {
                $chunk[$i][0] = $chunk[$i-1][0]
                        if ($chunk[$i][0] eq 'incomplete');
        }

        # guardian: its empty class forces the final flush below
        push @chunk, ["", ""];

        # lines collected so far, by class
        my %pending = (ctx => [], rem => [], add => []);
        # the class of the previous line
        my $prev_class = '';

        foreach my $entry (@chunk) {
                my ($class, $line) = @$entry;

                # print chunk headers
                if ($class && $class eq 'chunk_header') {
                        print format_diff_line($line, $class, $from, $to);
                        next;
                }

                # Flush the accumulator at the end of the chunk (guardian),
                # when a context line follows some rem/add lines, or when
                # both rem and add lines are held and a new block starts
                # (otherwise rem/add lines could be reordered).
                my $have_changes = (@{$pending{'rem'}} || @{$pending{'add'}});
                my $have_both    = (@{$pending{'rem'}} && @{$pending{'add'}});
                if (!$class ||
                    ($have_changes && $class eq 'ctx') ||
                    ($have_both && $class ne $prev_class)) {
                        print_diff_lines($pending{'ctx'}, $pending{'rem'}, $pending{'add'},
                                         $diff_style, $num_parents);
                        @$_ = () foreach (values %pending);
                }

                # guardian value reached
                last unless $line;

                # collect the line; classes other than ctx/rem/add are dropped
                push @{$pending{$class}}, $line
                        if (exists $pending{$class});

                $prev_class = $class;
        }
}
5253
# Read patch output from the filehandle $fd and print it as an HTML
# "patchset" <div>, one "patch" <div> per patch.
#
# $diff_style     - passed on to print_diff_chunk()
# $difftree       - array reference with the raw difftree lines; each patch
#                   is matched against them to get its $diffinfo
# $hash           - not used in this sub
# @hash_parents   - parent ids; more than one means a combined diff
#
# Raw difftree entries that have no patch in the input (compact combined
# diff can skip patches) get a simplified placeholder <div> instead.
sub git_patchset_body {
        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;

        my $num_parents = scalar @hash_parents;
        my $is_combined = ($num_parents > 1);
        my $patch_idx = 0;     # index into @$difftree
        my $patch_number = 0;  # number of patches printed so far
        my ($patch_line, $diffinfo, $to_name);
        my (%from, %to);
        my @chunk; # for side-by-side diff

        # Print the simplified <div> for the current $diffinfo; also the
        # anchor for "patch" links in difftree / whatchanged part.
        my $print_simplified_patch = sub {
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"
        };

        # Print the lines collected in @chunk and start a new chunk.
        my $flush_chunk = sub {
                print_diff_chunk($diff_style, $num_parents, \%from, \%to, @chunk);
                @chunk = ();
        };

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while (defined($patch_line = <$fd>)) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belongs to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches
                        # skipped; find which patch (using pathname of result)
                        # we are at now, printing placeholders on the way
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        $print_simplified_patch->();

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header; $patch_line is a chomp-ed "diff ..." line here
                $patch_number++;
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while (defined($patch_line = <$fd>)) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # input ended inside the extended header: close the patch here,
                # because 'last' does not run the continue block below
                if (! $patch_line) {
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                # patch without from-file/to-file header and without body
                next PATCH if ($patch_line =~ m/^diff /);

                # from-file/to-file diff header: $patch_line is the "---" line,
                # the next line read is expected to be the "+++" line
                my $from_header_line = $patch_line;
                $patch_line = <$fd>;
                chomp $patch_line;

                print format_diff_from_to_header($from_header_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while (defined($patch_line = <$fd>)) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        my $class = diff_line_class($patch_line, \%from, \%to);

                        # a new chunk header ends the chunk collected so far
                        $flush_chunk->() if ($class eq 'chunk_header');

                        push @chunk, [ $class, $patch_line ];
                }

        } continue {
                # runs after every patch, including those left via 'next PATCH'
                $flush_chunk->() if (@chunk);
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        $patch_idx++ if ($patch_number > 0);
        while ($patch_idx < @$difftree) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                $print_simplified_patch->();

                $patch_number++;
                $patch_idx++;
        }

        if ($patch_number == 0) {
                my $message = $is_combined ? "Trivial merge" : "No differences found";
                print "<div class=\"diff nodifferences\">$message</div>\n";
        }

        print "</div>\n"; # class="patchset"
}
5416
5417 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5418
# Print the project search form shown with the project list.
#
# $searchtext        - initial value of the search text field 's'
# $search_use_regexp - whether the 're' checkbox ('sr') starts checked
#
# Uses the globals $cgi, $my_uri and $project_filter.  When $project_filter
# is set, it is sent along as the hidden field 'pf' and mentioned in the
# field title and in the "List all projects" link text.
sub git_project_search_form {
        my ($searchtext, $search_use_regexp) = @_;

        my $limit = '';
        if ($project_filter) {
                $limit = " in '$project_filter/'";
        }

        print "<div class=\"projsearch\">\n";
        # start_form() rather than its deprecated alias startform(), which
        # newer CGI.pm releases no longer provide; this also matches the
        # end_form() call below.
        print $cgi->start_form(-method => 'get', -action => $my_uri) .
              $cgi->hidden(-name => 'a', -value => 'project_list')  . "\n";
        print $cgi->hidden(-name => 'pf', -value => $project_filter). "\n"
                if (defined $project_filter);
        print $cgi->textfield(-name => 's', -value => $searchtext,
                              -title => "Search project by name and description$limit",
                              -size => 60) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>\n" .
              $cgi->submit(-name => 'btnS', -value => 'Search') .
              $cgi->end_form() . "\n" .
              $cgi->a({-href => href(project => undef, searchtext => undef,
                                     project_filter => $project_filter)},
                      esc_html("List all projects$limit")) . "<br />\n";
        print "</div>\n";
}
5446
# Tell whether %$project_info still needs filling for the given @keys:
# returns 1 as soon as one of the keys does not exist in the hash, and
# nothing (empty list / undef) when all of them exist or no keys are given.
# Only the existence of a key is checked, not whether its value is defined.
sub project_info_needs_filling {
        my ($project_info, @keys) = @_;

        # same as: List::MoreUtils::any { !exists $project_info->{$_} } @keys
        for my $wanted (@keys) {
                return 1 unless (exists $project_info->{$wanted});
        }
        return;
}
5460
# Fill in project info (age, description, owner, ctags, category) for each
# project in @$projlist and return the list of projects that were kept.
#
# With @wanted_keys given, only those fields are considered; without them
# all fields are.  A field is (re)computed only if it does not exist yet
# in the project's hash.
#
# A project is dropped from the returned list only when 'age' or
# 'age_string' has to be filled and git_get_last_activity() returns
# nothing for it.  No other field causes a project to be dropped.
#
# USAGE:
# * fill_project_list_info(\@project_list, 'descr_long', 'ctags')
#   ensures that 'descr_long' and 'ctags' fields are filled
# * @project_list = fill_project_list_info(\@project_list)
#   ensures that all fields are filled (and invalid projects removed)
#
# NOTE: modifies the entries of $projlist, but does not remove any of them
sub fill_project_list_info {
        my ($projlist, @wanted_keys) = @_;

        # restricts a list of field names to the wanted ones, if any were given
        my %is_wanted = map { $_ => 1 } @wanted_keys;
        my $filter_set = @wanted_keys
                ? sub { return grep { $is_wanted{$_} } @_; }
                : sub { return @_; };

        my $show_ctags = gitweb_check_feature('ctags');

        my @projects;
 PROJECT:
        foreach my $pr (@$projlist) {
                # true if at least one of the given (and wanted) fields is missing
                my $needs = sub {
                        return project_info_needs_filling($pr, $filter_set->(@_));
                };

                if ($needs->('age', 'age_string')) {
                        my @activity = git_get_last_activity($pr->{'path'});
                        next PROJECT unless (@activity);
                        ($pr->{'age'}, $pr->{'age_string'}) = @activity;
                }

                if ($needs->('descr', 'descr_long')) {
                        my $descr = git_get_project_description($pr->{'path'}) || "";
                        $descr = to_utf8($descr);
                        $pr->{'descr_long'} = $descr;
                        $pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
                }

                if ($needs->('owner')) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
                }

                if ($show_ctags && $needs->('ctags')) {
                        $pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
                }

                if ($projects_list_group_categories && $needs->('category')) {
                        my $cat = git_get_project_category($pr->{'path'}) ||
                                  $project_list_default_category;
                        $pr->{'category'} = to_utf8($cat);
                }

                push @projects, $pr;
        }

        return @projects;
}
5521
# Return the projects of @$projlist sorted by $order, which is one of
# 'project', 'descr', 'owner' (compared as strings) or 'age' (compared as
# a number).  For any other $order the list is returned in its original
# order.  @$projlist itself is not modified.
sub sort_projects_list {
        my ($projlist, $order) = @_;

        # sort order name => hash key to compare and how to compare it
        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );

        my $oi = $order_info{$order};
        return @$projlist unless defined $oi;

        my $field = $oi->{'key'};
        my @projects;
        if ($oi->{'type'} ne 'str') {
                @projects = sort { $a->{$field} <=> $b->{$field} } @$projlist;
        } else {
                @projects = sort { $a->{$field} cmp $b->{$field} } @$projlist;
        }

        return @projects;
}
5542
# Group the projects at indices $from..$to of @$projlist by their
# 'category' field.  $from defaults to 0; $to defaults to, and is limited
# to, the last index of the list.
# Returns a hash mapping each category to an array reference of its
# projects (in list order): the hash itself in list context, a reference
# to it otherwise.
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;

        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        my %categories;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];
                push @{$categories{ $pr->{'category'} }}, $pr;
        }

        return \%categories unless wantarray;
        return %categories;
}
5559
# Print a 'sort by' <th> element.  All arguments are handed unchanged to
# format_sort_th(), which builds the element (with a 'sort by $name'
# replay link unless that order is already selected).
sub print_sort_th {
        my $sort_th = format_sort_th(@_);

        print $sort_th;
}
5565
# Build the <th> element for a sortable column and return it as a string.
#
# $name   - name of the sort order this column stands for
# $order  - sort order currently in use
# $header - column title; defaults to ucfirst($name)
#
# If the column is the one currently sorted by, the title is plain text;
# otherwise it is a link (class "header") that replays the current request
# with order=$name.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        my $content = ($order eq $name)
                ? $header
                : $cgi->a({-href => href(-replay=>1, order=>$name),
                           -class => "header"}, $header);

        return "<th>" . $content . "</th>\n";
}
5582
# Print the table rows (<tr>) of the project list for the entries at
# indices $from..$to of @$projlist.  $from defaults to 0; $to defaults to,
# and is limited to, the last index of the list.
#
# Rows alternate between the classes "dark" and "light", starting with
# "dark".  A leading forks cell is printed when $check_forks is true.
# The owner and age cells are left out when the globals $omit_owner and
# $omit_age_column are set.  Matches of the global $search_regexp are
# highlighted in the project path and description.
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;

        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];

                # link to the given action of this project; the link text is
                # the action name itself
                my $action_link = sub {
                        my ($action) = @_;
                        return scalar($cgi->a({-href => href(project=>$pr->{'path'}, action=>$action)}, $action));
                };

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark ^= 1;

                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                my $nforks = scalar @{$pr->{'forks'}};
                                my $title = "$nforks forks";
                                # link to the forks only if there are any
                                if ($nforks > 0) {
                                        print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks"),
                                                       -title => $title}, "+");
                                } else {
                                        print $cgi->span({-title => $title}, "+");
                                }
                        }
                        print "</td>\n";
                }

                # project path and description, both linking to the summary
                print "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                        -class => "list"},
                                       esc_html_match_hl($pr->{'path'}, $search_regexp)) .
                      "</td>\n" .
                      "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                        -class => "list",
                                        -title => $pr->{'descr_long'}},
                                        $search_regexp
                                        ? esc_html_match_hl_chopped($pr->{'descr_long'},
                                                                    $pr->{'descr'}, $search_regexp)
                                        : esc_html($pr->{'descr'})) .
                      "</td>\n";

                if (!$omit_owner) {
                        print "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
                }
                if (!$omit_age_column) {
                        my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
                        print "<td class=\"". age_class($pr->{'age'}) . "\">" .
                            $age_text . "</td>\n";
                }

                # action links; "forks" only for projects that have a forks entry
                my @links = map { $action_link->($_) } qw(summary shortlog log tree);
                push @links, $action_link->('forks') if ($pr->{'forks'});
                print "<td class=\"link\">" .
                      join(" | ", @links) .
                      "</td>\n" .
                      "</tr>\n";
        }
}
5642
# Print the project list table, optionally preceded by the tag cloud.
#
# $projlist  - array reference with the projects to show (not modified;
#              a copy is filtered, filled and sorted)
# $order     - sort order; defaults to $default_projects_order
# $from, $to - window of the sorted list to show; default to the whole
#              list, $to is limited to the last index
# $extra     - if defined, HTML put in an extra row at the end of the table
# $no_header - if true, the row with the column headers is not printed
#
# Reads the globals $search_regexp, %input_params ('ctag'), $omit_owner,
# $omit_age_column, $projects_list_group_categories and $cgi.
# NOTE(review): the original comment says this "actually uses global
# variable $project"; no direct use is visible here, presumably it is
# reached through href() -- confirm.
sub git_project_list_body {
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $input_params{'ctag'} : undef;
        # forks are not handled specially while searching or filtering by tag
        $check_forks = undef
                if ($tagfilter || $search_regexp);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        # search_projects_list pre-fills required info
        @projects = search_projects_list(\@projects,
                                         'search_regexp' => $search_regexp,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $search_regexp);
        # fill the rest
        my @all_fields = ('descr', 'descr_long', 'ctags', 'category');
        push @all_fields, ('age', 'age_string') unless($omit_age_column);
        push @all_fields, 'owner' unless($omit_owner);
        @projects = fill_project_list_info(\@projects, @all_fields);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit: nothing left to show in the requested window
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner') unless $omit_owner;
                print_sort_th('age', $order, 'Last Change') unless $omit_age_column;
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @projects now holds just that window, indexed from 0, so the
                # whole of it is grouped; passing $from/$to again would skip
                # the first $from projects of the window.
                my %categories = build_projlist_by_category(\@projects);
                foreach my $cat (sort keys %categories) {
                        # projects with an empty category get no category row
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5733
# Print the body of the 'log' view: for each commit a header, the links
# to its commit / commitdiff / tree views, the authorship and the full
# commit message.
#
# $commitlist - array reference with parsed commits (hash references)
# $from, $to  - window of @$commitlist to print; $from defaults to 0,
#               $to defaults to, and is limited to, the last index
# $refs       - passed to format_ref_marker() for each commit
# $extra      - if true, HTML printed after the commits in a "page_nav" div
#
# NOTE(review): the original comment says this uses the global variable
# $project; presumably through href() -- confirm.
sub git_log_body {
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from (not at 0), like git_shortlog_body() and
        # git_history_body() do, so that the window is honoured
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                # skip empty entries
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                      git_print_authorship(\%co, -tag => 'span');
                      print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5772
# Print the 'shortlog' table: one row per commit with its date, author,
# subject and the links to its commit / commitdiff / tree views, followed
# by the snapshot links if format_snapshot_links() returns any.
#
# $commitlist - array reference with parsed commits (hash references)
# $from, $to  - window of @$commitlist to print; $from defaults to 0,
#               $to defaults to, and is limited to, the last index
# $refs       - passed to format_ref_marker() for each commit
# $extra      - if defined, HTML put in an extra row at the end of the table
#
# Rows alternate between the classes "dark" and "light", starting with
# "dark".
# NOTE(review): the original comment says this uses the global variable
# $project; presumably through href() -- confirm.
sub git_shortlog_body {
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        print "<table class=\"shortlog\">\n";
        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark ^= 1;

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my @links = (
                        scalar($cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit")),
                        scalar($cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff")),
                        scalar($cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree")),
                );
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links);

                # snapshot links are appended only if there are any
                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links
                        if (defined $snapshot_links);

                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5816
# Print the 'history' table: one row per commit in the history of a path.
#
# Warning: assumes constant type (blob or tree) during history
#
# Parameters:
#   $commitlist - reference to an array of parsed-commit hashes; entries
#                 that are empty hashes are skipped
#   $from, $to  - index range to print; $from defaults to 0 and $to is
#                 clamped to the last index of the list
#   $refs       - handed to format_ref_marker() together with each commit id
#   $extra      - optional HTML printed in a final row spanning 4 columns
#   $file_name  - path whose history is being shown
#   $file_hash  - hash of the current blob, compared with each commit's blob
#   $ftype      - used as both the action name and the text of the first
#                 link; the value 'blob' enables the "diff to current" link
#
# Also reads the file-level variable $hash_base for the blobdiff link.
sub git_history_body {
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        my $last_idx = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last_idx if (!defined $to || $to > $last_idx);

        print "<table class=\"history\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %entry = %{ $commitlist->[$idx] };
                next unless %entry;

                my $id = $entry{'id'};
                my $marker = format_ref_marker($refs, $id);

                my $row_class = $dark_row ? "dark" : "light";
                $dark_row ^= 1;
                print "<tr class=\"$row_class\">\n";

                # shortlog uses format_author_html('td', \%co, 10) here
                print "<td title=\"$entry{'age_string_age'}\"><i>$entry{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%entry, 15, 3) . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($entry{'title'}, $entry{'title_short'},
                                          href(action=>"commit", hash=>$id), $marker);

                my $view_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$id, file_name=>$file_name)}, $ftype);
                my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$id)}, "commitdiff");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $view_link . " | " . $diff_link;

                if ($ftype eq 'blob') {
                        # offer a diff only when this commit's blob differs
                        # from the blob currently being viewed
                        my $current_blob = $file_hash;
                        my $commit_blob  = git_get_hash_by_path($id, $file_name);
                        my $differs = defined $current_blob && defined $commit_blob &&
                                      $current_blob ne $commit_blob;
                        if ($differs) {
                                print " | " .
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$current_blob, hash_parent=>$commit_blob,
                                                               hash_base=>$hash_base, hash_parent_base=>$id,
                                                               file_name=>$file_name)},
                                                "diff to current");
                        }
                }
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5876
# Print the 'tags' table: one row per tag with age, name, subject and links.
#
# Parameters:
#   $taglist    - reference to an array of tag hashes (keys read here:
#                 subject, age, name, id, type, reftype, refid, fullname)
#   $from, $to  - index range to print; $from defaults to 0 and $to is
#                 clamped to the last index of the list
#   $extra      - optional HTML printed in a final row spanning 5 columns
sub git_tags_body {
        # uses global variable $project
        my ($taglist, $from, $to, $extra) = @_;

        my $last_idx = $#{$taglist};
        $from = 0 unless defined $from;
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        print "<table class=\"tags\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %tag = %{ $taglist->[$idx] };

                # the subject is optional; shorten it only when present
                my $subject = $tag{'subject'};
                my $subject_short;
                $subject_short = chop_str($subject, 30, 5) if defined $subject;

                my $row_class = $dark_row ? "dark" : "light";
                $dark_row ^= 1;
                print "<tr class=\"$row_class\">\n";

                # age column (left empty when the tag has no age)
                print(defined $tag{'age'}
                      ? "<td><i>$tag{'age'}</i></td>\n"
                      : "<td></td>\n");

                # name column, linking to the tagged object
                print "<td>" .
                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                               -class => "list name"}, esc_html($tag{'name'})) .
                      "</td>\n" .
                      "<td>";
                if (defined $subject) {
                        print format_subject_html($subject, $subject_short,
                                                  href(action=>"tag", hash=>$tag{'id'}));
                }

                # "tag" self link is shown only for entries of type "tag"
                print "</td>\n" .
                      "<td class=\"selflink\">";
                print($tag{'type'} eq "tag"
                      ? $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag")
                      : "&nbsp;");

                print "</td>\n" .
                      "<td class=\"link\">" . " | " .
                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});

                # extra links depend on the kind of object the tag points at
                my $reftype = $tag{'reftype'};
                if ($reftype eq "commit") {
                        print " | " . $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog") .
                              " | " . $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                } elsif ($reftype eq "blob") {
                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                }
                print "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5939
# Print the 'heads' table: one row per head with age, name and links.
#
# Parameters:
#   $headlist   - reference to an array of head hashes (keys read here:
#                 id, age, name, fullname)
#   $head_at    - optional id; a head whose id equals it gets the
#                 "current_head" cell class
#   $from, $to  - index range to print; $from defaults to 0 and $to is
#                 clamped to the last index of the list
#   $extra      - optional HTML printed in a final row spanning 3 columns
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head_at, $from, $to, $extra) = @_;

        my $last_idx = $#{$headlist};
        $from = 0 unless defined $from;
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        print "<table class=\"heads\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %head = %{ $headlist->[$idx] };
                my $is_current = defined $head_at && $head{'id'} eq $head_at;

                my $row_class = $dark_row ? "dark" : "light";
                $dark_row ^= 1;
                print "<tr class=\"$row_class\">\n";

                my $name_cell_open = $is_current ? "<td class=\"current_head\">" : "<td>";
                my $name_link = $cgi->a({-href => href(action=>"shortlog", hash=>$head{'fullname'}),
                                         -class => "list name"},esc_html($head{'name'}));
                my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$head{'fullname'})}, "shortlog");
                my $log_link      = $cgi->a({-href => href(action=>"log", hash=>$head{'fullname'})}, "log");
                my $tree_link     = $cgi->a({-href => href(action=>"tree", hash=>$head{'fullname'}, hash_base=>$head{'fullname'})}, "tree");

                print "<td><i>$head{'age'}</i></td>\n" .
                      $name_cell_open .
                      $name_link .
                      "</td>\n" .
                      "<td class=\"link\">" .
                      $shortlog_link . " | " .
                      $log_link . " | " .
                      $tree_link .
                      "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5977
# Display a single remote block: a table with the remote's URLs followed
# by the list of its heads.
#
# Parameters:
#   $remote - remote name, used for the "..." link to the 'remotes' action
#   $rdata  - hash reference for this remote; the keys 'heads', 'fetch'
#             and 'push' are read ('fetch' and 'push' may be undefined)
#   $limit  - optional maximum; when the remote has more heads than this,
#             a "..." link is passed on as the extra row, and the value is
#             also used as the last index given to git_heads_body()
#   $head   - passed to git_heads_body() as the id of the current head
sub git_remote_block {
        my ($remote, $rdata, $limit, $head) = @_;

        my $heads = $rdata->{'heads'};
        my $fetch = $rdata->{'fetch'};
        my $push = $rdata->{'push'};

        my $urls_table = "<table class=\"projects_list\">\n" ;

        if (defined $fetch) {
                # $push may be undefined here; check it before comparing so
                # that 'eq' never sees an undefined operand
                if (defined $push && $fetch eq $push) {
                        $urls_table .= format_repo_url("URL", $fetch);
                } else {
                        $urls_table .= format_repo_url("Fetch URL", $fetch);
                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
                }
        } elsif (defined $push) {
                $urls_table .= format_repo_url("Push URL", $push);
        } else {
                $urls_table .= format_repo_url("", "No remote URL");
        }

        $urls_table .= "</table>\n";

        # link to the full list only when the heads shown here are truncated
        my $dots;
        if (defined $limit && $limit < @$heads) {
                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
        }

        print $urls_table;
        git_heads_body($heads, $head, 0, $limit, $dots);
}
6011
# Display a list of remote names with the respective fetch and push URLs
#
# Parameters:
#   $remotedata - hash reference mapping remote name to a hash with the
#                 optional keys 'fetch' and 'push'
#   $limit      - optional maximum number of remotes to list; when there
#                 are more, the list is truncated and a "..." row linking
#                 to the 'remotes' action is appended
sub git_remotes_list {
        my ($remotedata, $limit) = @_;
        print "<table class=\"heads\">\n";
        my $alternate = 1;
        my @remotes = sort keys %$remotedata;

        my $limited = $limit && $limit < @remotes;

        # keep only the first $limit names
        $#remotes = $limit - 1 if $limited;

        # iterate with foreach rather than "while (shift)": the latter would
        # stop at the first remote whose name evaluates to false (e.g. "0")
        foreach my $remote (@remotes) {
                my $rdata = $remotedata->{$remote};
                my $fetch = $rdata->{'fetch'};
                my $push = $rdata->{'push'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td>" .
                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
                               -class=> "list name"},esc_html($remote)) .
                      "</td>";
                # a missing URL is shown as plain text instead of a link
                print "<td class=\"link\">" .
                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
                      " | " .
                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
                      "</td>";

                print "</tr>\n";
        }

        if ($limited) {
                print "<tr>\n" .
                      "<td colspan=\"3\">" .
                      $cgi->a({-href => href(action=>"remotes")}, "...") .
                      "</td>\n" . "</tr>\n";
        }

        print "</table>";
}
6055
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#
# Parameters:
#   $remotedata - hash reference mapping remote name to per-remote data
#   $limit      - optional threshold; with more remotes than this only the
#                 name list is shown, otherwise it is passed on to each
#                 remote block
#   $head       - passed on to git_remote_block()
sub git_remotes_body {
        my ($remotedata, $limit, $head) = @_;
        if ($limit and $limit < keys %$remotedata) {
                git_remotes_list($remotedata, $limit);
        } else {
                fill_remote_heads($remotedata);
                # Walk the remotes in sorted order, as git_remotes_list()
                # does, so the sections appear in a stable order and the
                # loop does not depend on the hash's internal iterator
                # while the section callbacks run.
                foreach my $remote (sort keys %$remotedata) {
                        my $rdata = $remotedata->{$remote};
                        git_print_section({-class=>"remote", -id=>$remote},
                                ["remotes", $remote, $remote], sub {
                                        git_remote_block($remote, $rdata, $limit, $head);
                                });
                }
        }
}
6072
# Render the result page of a commit-message, author or committer search.
#
# Takes a parsed commit as a flat key/value list (the 'tree' and 'title'
# keys are read).  Uses the file-level variables $searchtype, $searchtext,
# $search_use_regexp, $hash and $page.  Results are shown 100 per page; one
# extra commit is requested to find out whether a next page exists.
sub git_search_message {
        my %co = @_;

        # git-log option that selects which field is searched
        my %grep_option_for = (
                'commit'    => "--grep=",
                'author'    => "--author=",
                'committer' => "--committer=",
        );
        my $greptype = $grep_option_for{$searchtype};
        $greptype .= $searchtext;

        my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
        my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                       $greptype, '--regexp-ignore-case',
                                       $match_mode);

        # "first" and "prev" are links only when we are past the first page
        my $paging_nav;
        if ($page > 0) {
                my $first_link = $cgi->a({-href => href(-replay=>1, page=>undef)},
                                         "first");
                my $prev_link  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                          -accesskey => "p", -title => "Alt-p"}, "prev");
                $paging_nav = $first_link . " &sdot; " . $prev_link;
        } else {
                $paging_nav = "first &sdot; prev";
        }

        # more than 100 commits returned means there is a following page
        my $next_link = '';
        if (@commitlist > 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
                $paging_nav .= " &sdot; $next_link";
        } else {
                $paging_nav .= " &sdot; next";
        }

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        my $nothing_found = ($page == 0 && !@commitlist);
        if ($nothing_found) {
                print "<p>No match.</p>\n";
        } else {
                git_search_grep_body(\@commitlist, 0, 99, $next_link);
        }

        git_footer_html();
}
6122
# Render the result page of a "pickaxe" search (git log -S<text>).
#
# Takes a parsed commit as a flat key/value list (the 'tree' and 'title'
# keys are read for the page header).  Uses the file-level variables
# $searchtext, $search_use_regexp, $hash and @diff_opts.  Each commit
# reported by git-log becomes one table row that lists the files reported
# for it.
sub git_search_changes {
        my %co = @_;

        local $/ = "\n";
        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                ($search_use_regexp ? '--pickaxe-regex' : ())
                        or die_error(500, "Open git-log failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"pickaxe search\">\n";
        my $dark_row = 1;

        # from here on %co holds the commit whose row is currently open
        undef %co;

        # closes the row of the commit in %co (if any): ends the file list
        # cell and emits the cell with the "commit" and "tree" links
        my $finish_commit_row = sub {
                return unless %co;
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
                              "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
                                             hash_base=>$co{'id'})},
                              "tree") .
                      "</td>\n" .
                      "</tr>\n";
        };

        my @files;
        while (my $line = <$fd>) {
                chomp $line;
                next unless $line;

                my %set = parse_difftree_raw_line($line);

                if (defined $set{'commit'}) {
                        # a new commit starts: finish previous commit first
                        $finish_commit_row->();

                        my $row_class = $dark_row ? "dark" : "light";
                        $dark_row ^= 1;
                        print "<tr class=\"$row_class\">\n";

                        %co = parse_commit($set{'commit'});
                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                              "<td><i>$author</i></td>\n" .
                              "<td>" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                      -class => "list subject"},
                                      chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        next;
                }

                # anything else of interest is a file line with a target id
                next unless defined $set{'to_id'};
                # an all-zero target id is not linked
                next if ($set{'to_id'} =~ m/^0{40}$/);

                print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                              -class => "list"},
                              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                      "<br/>\n";
        }
        close $fd;

        # finish last commit
        $finish_commit_row->();

        print "</table>\n";

        git_footer_html();
}
6205
# Render the result page of a file-content search (git grep on a tree).
#
# Takes a parsed commit as a flat key/value list (the 'tree', 'id' and
# 'title' keys are read).  Uses the file-level variables $searchtext,
# $search_use_regexp, $search_regexp and $hash.  Matches are grouped per
# file, one table row per file, and the listing stops after roughly 1000
# lines of git-grep output.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        # '-e' marks the next argument as the pattern, so user-supplied
        # search text beginning with '-' cannot be taken for an option
        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
                $search_use_regexp ? ('-E', '-i') : '-F',
                '-e', $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        my $lastfile = '';
        my $file_href;
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                last if ($matches++ > 1000);
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        $binary = 1;
                } else {
                        # with -z the fields are NUL separated: file, line, text
                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
                }
                # git-grep on a tree prefixes names with "<tree>:"; drop it
                # for text and binary matches alike (no-op when absent)
                $file =~ s/^\Q$co{'tree'}\E://;

                if ($file ne $lastfile) {
                        # a new file starts: close the previous row, open a new one
                        $lastfile and print "</td></tr>\n";
                        # toggle the row class like the other tables do
                        # (the former "$alternate++" test was always true)
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                          file_name=>$file);
                        print "<td class=\"list\">".
                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        # wrap the matched part in a highlighting span; each
                        # piece is escaped separately
                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                $ltext = esc_html($1, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($2, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($3, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => $file_href.'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno)) .
                                ' ' .  $ltext . "</div>\n";
                }
        }
        if ($lastfile) {
                print "</td></tr>\n";
                if ($matches > 1000) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
6283
# Print the 'commit_search' table: one row per matching commit, showing
# the lines of the commit message that match the search expression.
#
# Parameters:
#   $commitlist - reference to an array of parsed-commit hashes; entries
#                 that are empty hashes are skipped
#   $from, $to  - index range to print; $from defaults to 0 and $to is
#                 clamped to the last index of the list
#   $extra      - optional HTML printed in a final row
#
# Uses the file-level variable $search_regexp for highlighting.
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;

        my $last_idx = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        print "<table class=\"commit_search\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{ $commitlist->[$idx] };
                next unless %co;

                my $commit = $co{'id'};

                my $row_class = $dark_row ? "dark" : "light";
                $dark_row ^= 1;
                print "<tr class=\"$row_class\">\n";

                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                               -class => "list subject"},
                              chop_and_escape_str($co{'title'}, 50) . "<br/>");

                # show every message line that contains a match, with the
                # match highlighted and some context on both sides
                foreach my $line (@{ $co{'comment'} }) {
                        next unless ($line =~ m/^(.*?)($search_regexp)(.*)$/i);
                        my ($lead, $match, $trail) = ($1, $2, $3);

                        $match = chop_str($match, 70, 5, 'center');
                        # split what is left of 80 characters between both
                        # sides, at most 30 characters each
                        my $contextlen = int((80 - length($match))/2);
                        $contextlen = 30 if ($contextlen > 30);
                        $lead  = chop_str($lead,  $contextlen, 10, 'left');
                        $trail = chop_str($trail, $contextlen, 10, 'right');

                        ($lead, $match, $trail) =
                                (esc_html($lead), esc_html($match), esc_html($trail));

                        print "$lead<span class=\"match\">$match</span>$trail<br />";
                }

                my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit");
                my $diff_link   = $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff");
                my $tree_link   = $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $commit_link .
                      " | " .
                      $diff_link .
                      " | " .
                      $tree_link;
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
6343
6344 ## ======================================================================
6345 ## ======================================================================
6346 ## actions
6347
# 'project_list' action: print the page listing the projects.
#
# Reads the optional 'order' request parameter and rejects it with a 400
# error unless it is exactly one of the known sort orders.  Fails with a
# 404 error when no projects are found.  Uses the file-level variables
# $project_filter, $strict_export, $home_text, $searchtext and
# $search_use_regexp.
sub git_project_list {
        my $order = $input_params{'order'};
        # the pattern is anchored so that only an exact order name passes;
        # unanchored, any value merely containing e.g. "age" was accepted
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        # optional site-specific text shown above the list
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }

        git_project_search_form($searchtext, $search_use_regexp);
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6370
# 'forks' action: print the page listing the forks of the current project.
#
# Reads the optional 'order' request parameter and rejects it with a 400
# error unless it is exactly one of the known sort orders.  The project
# name with a trailing ".git" removed is used as the filter for the
# projects list; a 404 error is raised when that list is empty.
sub git_forks {
        my $order = $input_params{'order'};
        # the pattern is anchored so that only an exact order name passes;
        # unanchored, any value merely containing e.g. "age" was accepted
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my $filter = $project;
        $filter =~ s/\.git$//;
        my @list = git_get_projects_list($filter);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6390
# 'project_index' action: print a plain-text index with one line per
# project, in the form "<path> <owner>".
#
# Both fields are percent-encoded, except that letters, digits,
# '_', '.', '-' and '/' are kept and a space is written as '+'.
# Fails with a 404 error when no projects are found.
sub git_project_index {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        foreach my $pr (@projects) {
                # look the owner up only when the list did not provide it
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                my ($path, $owner) = ($pr->{'path'}, $pr->{'owner'});
                # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
                # (the loop variable aliases $path and $owner in turn)
                foreach my $field ($path, $owner) {
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                }

                print "$path $owner\n";
        }
}
6417
6418 sub git_summary {
6419         my $descr = git_get_project_description($project) || "none";
6420         my %co = parse_commit("HEAD");
6421         my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
6422         my $head = $co{'id'};
6423         my $remote_heads = gitweb_check_feature('remote_heads');
6424
6425         my $owner = git_get_project_owner($project);
6426
6427         my $refs = git_get_references();
6428         # These get_*_list functions return one more to allow us to see if
6429         # there are more ...
6430         my @taglist  = git_get_tags_list(16);
6431         my @headlist = git_get_heads_list(16);
6432         my %remotedata = $remote_heads ? git_get_remotes_list() : ();
6433         my @forklist;
6434         my $check_forks = gitweb_check_feature('forks');
6435
6436         if ($check_forks) {
6437                 # find forks of a project
6438                 my $filter = $project;
6439                 $filter =~ s/\.git$//;
6440                 @forklist = git_get_projects_list($filter);
6441                 # filter out forks of forks
6442                 @forklist = filter_forks_from_projects_list(\@forklist)
6443                         if (@forklist);
6444         }
6445
6446         git_header_html();
6447         git_print_page_nav('summary','', $head);
6448
6449         print "<div class=\"title\">&nbsp;</div>\n";
6450         print "<table class=\"projects_list\">\n" .
6451               "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n";
6452         unless ($omit_owner) {
6453                 print  "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
6454         }
6455         if (defined $cd{'rfc2822'}) {
6456                 print "<tr id=\"metadata_lchange\"><td>last change</td>" .
6457                       "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
6458         }
6459
6460         # use per project git URL list in $projectroot/$project/cloneurl
6461         # or make project git URL from git base URL and project name
6462         my $url_tag = "URL";
6463         my @url_list = git_get_project_url_list($project);
6464         @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
6465         foreach my $git_url (@url_list) {
6466                 next unless $git_url;
6467                 print format_repo_url($url_tag, $git_url);
6468                 $url_tag = "";
6469         }
6470
6471         # Tag cloud
6472         my $show_ctags = gitweb_check_feature('ctags');
6473         if ($show_ctags) {
6474                 my $ctags = git_get_project_ctags($project);
6475                 if (%$ctags) {
6476                         # without ability to add tags, don't show if there are none
6477                         my $cloud = git_populate_project_tagcloud($ctags);
6478                         print "<tr id=\"metadata_ctags\">" .
6479                               "<td>content tags</td>" .
6480                               "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
6481                               "</tr>\n";
6482                 }
6483         }
6484
6485         print "</table>\n";
6486
6487         # If XSS prevention is on, we don't include README.html.
6488         # TODO: Allow a readme in some safe format.
6489         if (!$prevent_xss && -s "$projectroot/$project/README.html") {
6490                 print "<div class=\"title\">readme</div>\n" .
6491                       "<div class=\"readme\">\n";
6492                 insert_file("$projectroot/$project/README.html");
6493                 print "\n</div>\n"; # class="readme"
6494         }
6495
6496         # we need to request one more than 16 (0..15) to check if
6497         # those 16 are all
6498         my @commitlist = $head ? parse_commits($head, 17) : ();
6499         if (@commitlist) {
6500                 git_print_header_div('shortlog');
6501                 git_shortlog_body(\@commitlist, 0, 15, $refs,
6502                                   $#commitlist <=  15 ? undef :
6503                                   $cgi->a({-href => href(action=>"shortlog")}, "..."));
6504         }
6505
6506         if (@taglist) {
6507                 git_print_header_div('tags');
6508                 git_tags_body(\@taglist, 0, 15,
6509                               $#taglist <=  15 ? undef :
6510                               $cgi->a({-href => href(action=>"tags")}, "..."));
6511         }
6512
6513         if (@headlist) {
6514                 git_print_header_div('heads');
6515                 git_heads_body(\@headlist, $head, 0, 15,
6516                                $#headlist <= 15 ? undef :
6517                                $cgi->a({-href => href(action=>"heads")}, "..."));
6518         }
6519
6520         if (%remotedata) {
6521                 git_print_header_div('remotes');
6522                 git_remotes_body(\%remotedata, 15, $head);
6523         }
6524
6525         if (@forklist) {
6526                 git_print_header_div('forks');
6527                 git_project_list_body(\@forklist, 'age', 0, 15,
6528                                       $#forklist <= 15 ? undef :
6529                                       $cgi->a({-href => href(action=>"forks")}, "..."),
6530                                       'no_header');
6531         }
6532
6533         git_footer_html();
6534 }
6535
# Show a single tag object (taken from the global $hash): a header table
# linking to the tagged object, the authorship rows when the tag records
# an author, and the tag message.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('', '', $head, undef, $head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # both links of the header row lead to the tagged object, shown
        # with the action named after the object's type
        my @object_view = (action => $tag{'type'}, hash => $tag{'object'});
        my $object_link = $cgi->a({-class => "list", -href => href(@object_view)},
                                  $tag{'object'});
        my $type_link = $cgi->a({-href => href(@object_view)},
                                $tag{'type'});

        print qq!<div class="title_text">\n! .
              qq!<table class="object_header">\n! .
              qq!<tr>\n! .
              qq!<td>object</td>\n! .
              qq!<td>$object_link</td>\n! .
              qq!<td class="link">$type_link</td>\n! .
              qq!</tr>\n!;
        git_print_authorship_rows(\%tag, 'author')
                if defined $tag{'author'};
        print qq!</table>\n\n! .
              qq!</div>\n! .
              qq!<div class="page_body">!;

        # tag message, one escaped line per <br/>
        my $message_lines = $tag{'comment'};
        for my $message_line (@$message_lines) {
                chomp $message_line;
                print esc_html($message_line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6570
# Shared implementation behind git_blame, git_blame_incremental and
# git_blame_data.
#
# Takes one optional argument, the output format:
#   'porcelain'   - (default) parse "git blame -p" output and print the
#                   blame table
#   'incremental' - print the page with the plain file contents (read with
#                   "git cat-file blob") and empty commit cells, plus
#                   progress placeholders; the page tells the user that it
#                   requires JavaScript
#   'data'        - print the raw "git blame --incremental" output as
#                   text/plain, followed by an "END" line, and return
# A 'porcelain' request with a true 'javascript' input parameter is switched
# to 'incremental'.
#
# Works on the globals $file_name, $hash_base and $hash (the latter two are
# filled in when not given); problems are reported through die_error().
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $input_params{'javascript'}) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact, undef-safe comparison: the object type has to be
                # precisely "blob"; an undefined type is rejected as well,
                # without an "uninitialized value" warning
                if (!defined $ftype || $ftype ne "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $line = <$fd>) {
                        print to_utf8($line);
                }
                close $fd
                        or print "ERROR $!\n";

                # terminating line: "END", optionally followed by the elapsed
                # time and the number of git commands run
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        # offer a link to the other flavour of the blame view
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        # row classes; the porcelain view switches to the next one at the
        # start of every group of lines
        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit cell and line-number link are printed empty
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        # read the "<key> <value>" lines that follow the
                        # header, up to the TAB-prefixed line with the contents;
                        # the first value seen for a key of a commit is kept
                        my $data;
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # only the first line of a group carries a group size
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # one commit cell spanning the whole group
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent
                        # commit when one is known, else of the commit itself
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6802
# Blame view in the default format of git_blame_common.
sub git_blame {
        return git_blame_common();
}
6806
# Blame view in the 'incremental' format of git_blame_common.
sub git_blame_incremental {
        return git_blame_common('incremental');
}
6810
# Blame output in the 'data' format of git_blame_common.
sub git_blame_data {
        return git_blame_common('data');
}
6814
# Print the page listing the tags of the current project.
sub git_tags {
        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
        # the header title is passed as HTML (other callers hand over
        # esc_html()'d text), so the project path has to be escaped too
        git_print_header_div('summary', esc_html($project));

        my @tagslist = git_get_tags_list();
        if (@tagslist) {
                git_tags_body(\@tagslist);
        }
        git_footer_html();
}
6827
# Print the page listing the heads of the current project.
sub git_heads {
        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
        # the header title is passed as HTML (other callers hand over
        # esc_html()'d text), so the project path has to be escaped too
        git_print_header_div('summary', esc_html($project));

        my @headslist = git_get_heads_list();
        if (@headslist) {
                git_heads_body(\@headslist, $head);
        }
        git_footer_html();
}
6840
# used both for single remote view and for list of all the remotes
#
# The remote to show is taken from the 'hash' input parameter; without it
# all remotes are listed.  Dies with 403 when the 'remote_heads' feature is
# off, 500 when the remote information cannot be read, and 404 when nothing
# matches.
sub git_remotes {
        gitweb_check_feature('remote_heads')
                or die_error(403, "Remote heads view is disabled");

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my $remotedata = git_get_remotes_list($remote);
        die_error(500, "Unable to get remote information") unless defined $remotedata;

        unless (%$remotedata) {
                die_error(404, defined $remote ?
                        "Remote $remote not found" :
                        "No remotes found");
        }

        git_header_html(undef, undef, -action_extra => $remote);
        git_print_page_nav('', '',  $head, undef, $head,
                format_ref_views($remote ? '' : 'remotes'));

        fill_remote_heads($remotedata);
        # The header titles are passed as HTML (other callers hand over
        # esc_html()'d text); the remote name comes from the request and
        # the project path from the filesystem, so escape both.
        if (defined $remote) {
                git_print_header_div('remotes',
                        esc_html("$remote remote for $project"));
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        } else {
                git_print_header_div('summary', esc_html("$project remotes"));
                git_remotes_body($remotedata, undef, $head);
        }

        git_footer_html();
}
6873
# Send the raw contents of a blob to the client.
#
# The optional argument is a content type handed to blob_contenttype().
# The blob is selected by the global $hash, or looked up from $file_name in
# $hash_base (the project's head when no base is given).  Dies with 400/404
# when the blob cannot be identified and 500 when git-cat-file cannot be
# started.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name is sent inside a quoted-string, so backslash-escape the
        # two characters that would otherwise end or corrupt that string.
        (my $quoted_name = $save_as) =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* as text/plain; the same goes for textual */*+xml
        # types (the subtype in front of "+xml" may be of any length, e.g.
        # image/svg+xml or application/xhtml+xml)
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z0-9.-]+\+xml\b(.*)$! && -T $fd))) {
                # $1 holds whatever followed the type, e.g. "; charset=..."
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $quoted_name . '"');
        # slurp the blob and pass it through untouched
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6935
# Print the HTML view of a blob: an <img> tag for images, otherwise the
# contents line by line with line-number anchors (passed through the
# highlighter when a syntax was guessed).  Files that are neither text nor
# one of the displayable image types, and that look binary, are handed
# over to git_blob_plain() instead.
#
# The blob is selected by the global $hash, or looked up from $file_name in
# $hash_base (the project's head when no base is given).
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable base commit: empty navigation, blob id as title
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                # the URL is an attribute value like the others, so it gets
                # the same esc_attr() treatment as the line-number links
                print qq! src="! .
                      esc_attr(href(action=>"blob_plain", hash=>$hash,
                                    hash_base=>$hash_base, file_name=>$file_name)) .
                      qq!" />\n!;
        } else {
                my $nr;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        # highlighter output goes through sanitize(),
                        # plain text is escaped
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, esc_attr(href(-replay => 1)), $nr, $nr,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
7028
# Print the listing of one tree (directory).
#
# Works on the globals $hash (the tree), $hash_base (the commit the tree is
# looked at in, "HEAD" when not given) and $file_name (path of the tree).
# Dies with 404 when the tree cannot be found or read and with 500 when
# git-ls-tree cannot be started.
sub git_tree {
        $hash_base = "HEAD" unless defined $hash_base;
        unless (defined $hash) {
                $hash = defined $file_name
                        ? git_get_hash_by_path($hash_base, $file_name, "tree")
                        : $hash_base;
        }
        defined($hash) or die_error(404, "No such tree");

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        # read the NUL-terminated ls-tree records, one per tree entry
        my @entries;
        {
                local $/ = "\0";
                my @ls_tree_opts = ('-z');
                push @ls_tree_opts, '-l' if $show_sizes;
                open my $fd, "-|", git_cmd(), "ls-tree",
                        @ls_tree_opts, @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                chomp(@entries = <$fd>);
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();

        my %co;
        %co = parse_commit($hash_base) if defined $hash_base;
        if (%co) {
                my @views_nav;
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                # FIXME: Should be available when we have no hash base as well.
                my $snapshot_links = format_snapshot_links($hash);
                push @views_nav, $snapshot_links
                        if defined $snapshot_links;
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # no commit to show the tree in: forget the base, print an
                # empty navigation bar and use the tree id as title
                undef $hash_base;
                print qq!<div class="page_nav">\n!;
                print qq!<br/><br/></div>\n!;
                print qq!<div class="title">! . esc_html($hash) . qq!</div>\n!;
        }

        my $basedir = '';
        if (defined $file_name) {
                $basedir = $file_name;
                $basedir .= '/'
                        if ($basedir ne '' && substr($basedir, -1) ne '/');
                git_print_page_path($file_name, 'tree', $hash_base);
        }

        print qq!<div class="page_body">\n!;
        print qq!<table class="tree">\n!;

        # rows alternate between the two classes, starting with "dark"
        my $dark_row = 1;
        my $open_row = sub {
                print '<tr class="' . ($dark_row ? 'dark' : 'light') . "\">\n";
                $dark_row ^= 1;
        };

        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                $open_row->();

                # strip the last path component; an empty (false) rest
                # means that the link carries no file name
                (my $up = $file_name) =~ s!/?[^/]+$!!;
                $up = undef unless $up;

                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print qq!<td class="link"></td>\n!;

                print "</tr>\n";
        }

        for my $entry (@entries) {
                my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

                $open_row->();
                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);
                print "</tr>\n";
        }

        print "</table>\n" .
              "</div>";
        git_footer_html();
}
7138
# Build the name "<project>-<version>" for a snapshot of $hash in $project.
#
# The project part is the last path component without a trailing ".git"
# (or "/.git"), with control characters replaced by "?".  The version part
# depends on how the revision was given; see the comments below.
# Returns the name in scalar context and the name twice in list context.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $name = to_utf8($project);
        $name =~ s,([^/])/*\.git$,$1,;
        $name = basename($name);
        # sanitize name
        $name =~ s/[[:cntrl:]]/?/g;

        my $ver;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # SHA-1 hash: shorten it when it is longer than 7 characters
                # and is a prefix of the full hash, otherwise use it as is
                $ver = $hash;
                my $full_hash = git_get_full_hash($project, $hash);
                $ver = git_get_short_hash($project, $hash)
                        if ($full_hash =~ /^$hash/ && length($hash) > 7);
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $ver = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                $ver = ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!) ? $1 : $hash;
                $ver = join('-', $ver, git_get_short_hash($project, $hash));
        }
        # in case of hierarchical branch names
        $ver =~ tr{/}{.};

        # name = project-version_string
        $name = join('-', $name, $ver);

        return ($name, $name) if wantarray;
        return $name;
}
7175
# Conditional-GET support.
#
# If the request carries an If-Modified-Since header that can be parsed
# (with HTTP::Date if it loads, otherwise with Time::ParseDate if that
# loads) and $latest_epoch is not later than that time, print a
# "304 Not Modified" header with Last-Modified set from $latest_epoch and
# jump to the DONE_GITWEB label.  In every other case control simply falls
# through to the caller.
sub exit_if_unmodified_since {
        my ($latest_epoch) = @_;
        our $cgi;

        my $header_value = $cgi->http('IF_MODIFIED_SINCE');
        if (defined $header_value) {
                # Use whichever date parser is installed; stays undef when
                # neither module can be loaded.
                my $since =
                        (eval { require HTTP::Date; 1; })
                                ? HTTP::Date::str2time($header_value) :
                        (eval { require Time::ParseDate; 1; })
                                ? Time::ParseDate::parsedate($header_value, GMT => 1) :
                        undef;

                if (defined $since && $since >= $latest_epoch) {
                        my %latest_date = parse_date($latest_epoch);
                        print $cgi->header(
                                -last_modified => $latest_date{'rfc2822'},
                                -status => '304 Not Modified');
                        goto DONE_GITWEB;
                }
        }
}
7197
# Send a snapshot archive of the tree-ish $hash of $project to the client.
#
# The archive format is taken from the 'snapshot_format' input parameter
# and defaults to the first entry of @snapshot_fmts.  It must be a known,
# enabled and configured format, otherwise a 400/403 error is reported.
# The archive itself is produced by "git archive", optionally piped through
# the compressor configured for the format in %known_snapshot_formats.
#
# When $hash parses as a commit, its committer date is used for
# Last-Modified and for answering If-Modified-Since requests.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";

        my %co = parse_commit($hash);
        exit_if_unmodified_since($co{'committer_epoch'}) if %co;

        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # escape '"' and '\' for use inside the quoted filename parameter
        $filename =~ s/(["\\])/\\$1/g;
        my %latest_date;
        if (%co) {
                %latest_date = parse_date($co{'committer_epoch'}, $co{'committer_tz'});
        }

        # Start the archive pipeline before any header is emitted, so that a
        # failure to launch it is reported as an error response instead of
        # following an already sent "200 OK" header.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                %co ? (-last_modified => $latest_date{'rfc2822'}) : (),
                -status => '200 OK');

        # Copy the archive through in fixed-size chunks: reading it with
        # <$fd> in list context would first build a list of the complete
        # (binary) archive in memory.
        binmode STDOUT, ':raw';
        binmode $fd, ':raw';
        my $chunk;
        while (read($fd, $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
7255
# Common implementation of the paged commit-list views.
#
# Parameters:
#   $fmt_name  - name of the view, passed to format_paging_nav() and
#                git_print_page_nav()
#   $body_subr - code reference that prints the list body; it is called as
#                $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
#                             $file_name, $file_hash, $ftype)
#   $base      - revision to list from (default: project HEAD)
#   $parent    - if defined, only "$parent..$base" is listed
#   $file_name - if defined, the listing is limited to this path
#                (with --full-history)
#   $file_hash - object id of $file_name; when missing it is looked up in
#                the listed commits
#
# 101 commits are requested per page (offset 100 * $page) so that the
# presence of a 101st entry tells whether a "next" link is needed.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        $base = $head unless defined $base;
        $page = 0     unless defined $page;
        my $refs = git_get_references();

        my $commit_hash = defined $parent ? "$parent..$base" : $base;
        my @path_limit  = defined $file_name ? ($file_name, "--full-history") : ();
        my @commitlist  =
                parse_commits($commit_hash, 101, (100 * $page), @path_limit);

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        $ftype = git_get_type($file_hash) if defined $file_hash;
        die_error(500, "Unknown type of object")
                if defined $file_name && !defined $ftype;

        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }

        # a 101st entry means there is at least one more page
        my $has_next_page = $#commitlist >= 100;

        my $paging_nav = format_paging_nav($fmt_name, $page, $has_next_page);
        my $next_link = '';
        if ($has_next_page) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        # offer "patches" only for whole-commit listings that fit the limit
        # (a negative limit means "no limit")
        my $patch_max = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name &&
            ($patch_max < 0 || @commitlist <= $patch_max)) {
                $paging_nav .= " &sdot; " .
                        $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                "patches");
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
                git_print_page_path($file_name, $ftype, $hash_base);
        } else {
                git_print_header_div('summary', $project);
        }

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
7329
# Commit log view: git_log_generic() with git_log_body as the body printer,
# listing from $hash and, when $hash_parent is set, limited to
# "$hash_parent..$hash".
sub git_log {
        return git_log_generic('log', \&git_log_body, $hash, $hash_parent);
}
7334
# Print the page for a single commit: navigation bar, header, authorship,
# links to the tree and to each parent, the commit message and the list of
# changed files.
#
# The commit is $hash, falling back to $hash_base and then to "HEAD".
# An unknown commit is reported as a 404 error.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
                or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav .= '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                my $parent_link =
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$parent)},
                                esc_html(substr($parent, 0, 7)));
                $formats_nav .= '(parent: ' . $parent_link . ')';
        } else {
                # merge commit
                my @parent_links = map {
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$_)},
                                esc_html(substr($_, 0, 7)));
                } @$parents;
                $formats_nav .= '(merge: ' . join(' ', @parent_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # a parentless commit is diffed against the empty tree
        $parent = "--root" unless defined $parent;

        # raw list of changed files; merges get the combined ('-c') form
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                (@$parents <= 1 ? $parent : '-c'),
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        my @difftree = <$fd>;
        chomp @difftree;
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        my $title = esc_html($co{'title'}) . $ref;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title, $hash);
        } else {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        }

        # object header table: authorship, commit id, tree, parents
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

        my $tree_id_link =
                $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                         class => "list"}, $co{'tree'});
        my $tree_link =
                $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                        "tree");
        print "<tr>" .
              "<td>tree</td>" .
              "<td class=\"sha1\">" . $tree_id_link . "</td>" .
              "<td class=\"link\">" . $tree_link;
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td>" .
              "</tr>\n";

        foreach my $par (@$parents) {
                my $parent_id_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$par),
                                 class => "list"}, $par);
                my $commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit");
                my $diff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff");
                print "<tr>" .
                      "<td>parent</td>" .
                      "<td class=\"sha1\">" . $parent_id_link . "</td>" .
                      "<td class=\"link\">" . $commit_link . " | " . $diff_link . "</td>" .
                      "</tr>\n";
        }
        print "</table>".
              "</div>\n";

        # commit message
        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        # changed files
        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
7448
# Find out the type of the requested object and redirect (302) to the view
# named after that type.
#
# The object is identified either by
#   - $hash or $hash_base alone, or
#   - $hash_base together with $file_name (a path inside that revision).
# A missing object is reported as 404; a request giving neither form is
# reported as 400.
sub git_object {
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # nothing is read when cat-file fails (its stderr is
                # discarded above); do not chomp undef, the failure is
                # reported right below
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");
                defined $type
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7495
# Show the difference between two versions of a single file.
#
# Parameter: output format, 'html' (default) or 'plain'.
#
# The two sides are given by $hash_parent_base and $hash_base together with
# either $file_name (optionally $file_parent for the old name) or the
# 40-digit blob id $hash, from which the file name is looked up in the raw
# diff-tree output.  Requests lacking these parameters (including the
# legacy URI style) are rejected.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                # (\Q..\E: $hash is request data and must be
                                # matched literally, not as a pattern)
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        # (numeric status code, as at every other die_error call site)
        if (!%diffinfo) {
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # escape '"' and '\' for use inside the quoted filename
                # parameter, the same way git_snapshot does
                my $header_name = "$file_name";
                $header_name =~ s/(["\\])/\\$1/g;

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $header_name . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # In the patch header (everything up to and including the
                # '+++' line) replace object ids used as file names with
                # the real file names; the ids are matched literally.
                while (my $line = <$fd>) {
                        $line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7630
# Plain-text variant of the blob diff view: git_blobdiff() in 'plain' format.
sub git_blobdiff_plain {
        return git_blobdiff('plain');
}
7634
# Build the navigation fragment for choosing the diff style.
#
# Parameters:
#   $diff_style  - the style currently in use (default 'inline'); it is
#                  shown as plain text, every other style as a link
#   $is_combined - when true an empty string is returned
#
# The fragment is meant to be appended to already existing navigation,
# so it reads " | foo | bar" rather than just "foo | bar".
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;
        $diff_style ||= 'inline';

        return "" if ($is_combined);

        # style names in display order, and their link texts
        my @style_order = ('inline', 'sidebyside');
        my %label_for = (inline => 'inline', 'sidebyside' => 'side by side');

        my $nav = '';
        foreach my $style (@style_order) {
                my $entry = $style eq $diff_style
                        ? $label_for{$style}
                        : $cgi->a({-href => href(-replay=>1, diff_style => $style)}, $label_for{$style});
                $nav .= " | " . $entry;
        }
        return $nav;
}
7655
# Show the changes introduced by a commit.
#
# Named parameters:
#   -format => 'html' (default), 'plain' or 'patch'
#   -single => for 'patch' without $hash_parent: emit just one patch
#
# The commit is $hash (falling back to $hash_base, then "HEAD").  It is
# compared against $hash_parent when that is given; otherwise against its
# parent, as a '--cc' combined diff for merges, or with '--root' for a
# parentless commit.  'patch' output comes from git format-patch and is only
# available when the 'patches' feature is enabled.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch' && !$patch_max) {
                die_error(403, "Patch view not allowed");
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
                or die_error(404, "Unknown commit object");
        my $parents = $co{'parents'}; # listref

        # choose format for commitdiff for merge
        # NOTE(review): this also applies to 'patch' format, where the value
        # later ends up in the "$hash_parent..$hash" range -- confirm that
        # is intended.
        if (! defined $hash_parent && @$parents > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @$parents <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @$parents > 1);

                my $explicit_parent = defined $hash_parent &&
                        $hash_parent ne '-c' && $hash_parent ne '--cc';
                if ($explicit_parent) {
                        # commitdiff with two commits given
                        my $hash_parent_short =
                                ($hash_parent =~ m/^[0-9a-fA-F]{40}$/)
                                ? substr($hash_parent, 0, 7)
                                : $hash_parent;
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of them
                        foreach my $idx (0 .. $#$parents) {
                                next unless $parents->[$idx] eq $hash_parent;
                                $formats_nav .= ' parent ' . ($idx+1);
                                last;
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @$parents == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit: link to the other combined-diff form
                        # ('--cc' is shown -> offer '-c', and vice versa)
                        my ($other_mode, $other_label) =
                                $hash_parent eq '--cc'
                                ? ('-c',   'combined')
                                : ('--cc', 'compact');
                        $formats_nav .= ' | ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash, hash_parent=>$other_mode)},
                                        $other_label);

                        my @parent_links = map {
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$_, hash_base=>undef)},
                                        esc_html(substr($_, 0, 7)));
                        } @$parents;
                        $formats_nav .=
                                ' (merge: ' . join(' ', @parent_links) . ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @$parents > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $raw_line = <$fd>) {
                        chomp $raw_line;
                        # empty line ends raw part of diff-tree output
                        last unless $raw_line;
                        push @difftree, scalar parse_difftree_raw_line($raw_line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                if ($hash_parent) {
                        push @commit_spec, "-$patch_max" if $patch_max > 0;
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } elsif ($params{-single}) {
                        push @commit_spec, '-1', '--root', $hash;
                } else {
                        push @commit_spec, "-$patch_max" if $patch_max > 0;
                        push @commit_spec, "-n", '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                # the title alone is already shown in the header
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                # NOTE(review): $refs is not used below -- confirm whether
                # this lookup is still needed.
                my $refs = git_get_references("tags");
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $filename . '"');

                # mail-like header, followed by the commit message
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $comment_line (@{$co{'comment'}}) {
                        print to_utf8($comment_line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $filename . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit second commit the diff is against the
                # commit's own parents
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                my @diff_parents = $use_parents ? @$parents : $hash_parent;

                git_difftree_body(\@difftree, $hash, @diff_parents);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash, @diff_parents);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
7883
# Action handler: show a commitdiff as plain text.
# Delegates to git_commitdiff() with the 'plain' output format.
sub git_commitdiff_plain {
        my @opts = (-format => 'plain');
        return git_commitdiff(@opts);
}
7887
7888 # format-patch-style patches
# Action handler: format-patch-style output, requested with -single => 1
# (presumably limiting the output to one commit -- see git_commitdiff()).
sub git_patch {
        my @opts = (
                -format => 'patch',
                -single => 1,
        );
        return git_commitdiff(@opts);
}
7892
# Action handler: format-patch-style output without the -single
# restriction that git_patch() applies.
sub git_patches {
        my @opts = (-format => 'patch');
        return git_commitdiff(@opts);
}
7896
# Action handler: 'history' view.
# Hands the request-level globals to the generic log machinery, using
# git_history_body() as the body renderer.
sub git_history {
        my @log_args = (
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
        return git_log_generic('history', \&git_history_body, @log_args);
}
7902
# Action handler: 'search'.
#
# Validates the request (features enabled, search text present, commit
# resolvable) and then hands over to the handler for the requested search
# type.  Works on the request-level globals $searchtype, $searchtext,
# $hash and $page, filling in defaults for $searchtype, $hash and $page.
sub git_search {
        $searchtype ||= 'commit';

        # check if appropriate features are enabled
        gitweb_check_feature('search')
                or die_error(403, "Search is disabled");

        # Search types that have their own feature switch (the feature is
        # named after the search type), with the error shown when it is off:
        #  - pickaxe may take all resources of your box and run for several
        #    minutes with every query - so decide by yourself how public you
        #    make this feature
        #  - grep search might be potentially CPU-intensive, too
        my %disabled_message_for = (
                'pickaxe' => "Pickaxe search is disabled",
                'grep'    => "Grep search is disabled",
        );
        if (exists $disabled_message_for{$searchtype}) {
                gitweb_check_feature($searchtype)
                        or die_error(403, $disabled_message_for{$searchtype});
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        # search from HEAD unless a starting point was given
        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0
                unless defined $page;

        # search type => sub doing the actual work
        my %handler_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );
        my $handler = $handler_for{$searchtype};
        if (defined $handler) {
                $handler->(%co);
        } else {
                die_error(400, "Unknown search type");
        }
}
7947
# Action handler: static help page describing the available search types.
# The 'grep' and 'pickaxe' entries are only printed when the corresponding
# feature is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('', '', ($hash) x 3);

        # introduction and the always-available 'commit' search
        print <<HELP_COMMIT;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_COMMIT

        if (gitweb_check_feature('grep')) {
                print <<HELP_GREP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        if (gitweb_check_feature('pickaxe')) {
                print <<HELP_PICKAXE;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
7991
# Action handler: 'shortlog' view.
# Runs the generic log machinery over $hash / $hash_parent with
# git_shortlog_body() as the body renderer.
sub git_shortlog {
        my @log_args = ($hash, $hash_parent);
        return git_log_generic('shortlog', \&git_shortlog_body, @log_args);
}
7996
7997 ## ......................................................................
7998 ## feeds (RSS, Atom; OPML)
7999
# Print a web feed (RSS 2.0 or Atom) of recent commits.
#
# Parameters:
#   $format - 'rss' or 'atom'; defaults to 'atom' when omitted or false.
#             Any other value is rejected with a 400 error.
#
# The feed covers $hash (HEAD when $hash is unset) and is limited to the
# history of $file_name when that is set.  The HTTP header carries a
# Last-Modified date taken from the newest commit; for HEAD requests only
# the header is sent.  Each feed entry consists of the commit message
# followed by a list of the changed files with diff / blame / history
# links.
#
# Everything interpolated into the XML is escaped first; in particular
# the feed title, which is built from request parameters.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                # NOTE(review): presumably answers conditional requests
                # (If-Modified-Since) and does not return when the feed is
                # unchanged -- confirm against exit_if_unmodified_since()
                exit_if_unmodified_since($latest_epoch);
                # the key is 'committer_tz', spelled like 'committer_epoch' above
                %latest_date = parse_date($latest_epoch, $latest_commit{'committer_tz'});
        }
        print $cgi->header(
                -type => $content_type,
                -charset => 'utf-8',
                %latest_date ? (-last_modified => $latest_date{'rfc2822'}) : (),
                -status => '200 OK');

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title contains request parameters ($hash, $file_name, ...),
        # so it has to be escaped before it is put into the XML below
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (defined $descr) {
                $descr = esc_html($descr);
        } else {
                $descr = esc_html("$project " .
                                  ($format eq 'rss' ? 'RSS' : 'Atom') .
                                  " feed");
        }
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for (my $i = 0; $i <= $#commitlist; $i++) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show the first 20 and, beyond
                # those, the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files; a commit whose diff-tree cannot
                # be run or read is left out of the feed
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        $line = esc_html($line);
                        print "$line\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
8236
# Action handler: commit feed in RSS format (see git_feed()).
sub git_rss {
        my $format = 'rss';
        return git_feed($format);
}
8240
# Action handler: commit feed in Atom format (see git_feed()).
sub git_atom {
        my $format = 'atom';
        return git_feed($format);
}
8244
# Action handler: OPML export.
#
# Prints an OPML 1.0 document with one <outline> per project returned by
# git_get_projects_list(), each pointing at the project's RSS feed and its
# summary page.  Projects for which no head hash or no head commit can be
# obtained are left out.  Dies with a 404 error when the project list is
# empty.
#
# Note: overwrites the global $git_dir for every project visited.
sub git_opml {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found")
                unless @projects;

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # mention the subdirectory in the title only when filtering by one
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $proj (@projects) {
                my $proj_path = $proj->{'path'};

                my $head = git_get_head_hash($proj_path);
                next unless defined $head;

                # NOTE(review): presumably parse_commit() reads the repository
                # named by $git_dir -- confirm against its definition
                $git_dir = "$projectroot/$proj_path";
                my %head_commit = parse_commit($head);
                next unless %head_commit;

                my $label    = esc_html(chop_str($proj_path, 25, 5));
                my $feed_url = href('project' => $proj_path, 'action' => 'rss', -full => 1);
                my $page_url = href('project' => $proj_path, 'action' => 'summary', -full => 1);
                print qq!<outline type="rss" text="$label" title="$label" ! .
                      qq!xmlUrl="$feed_url" htmlUrl="$page_url"/>\n!;
        }

        print <<XML;
</outline>
</body>
</opml>
XML
}