Sync with v2.2.1
[git.git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
21 binmode STDOUT, ':utf8';
22
23 if (!defined($CGI::VERSION) || $CGI::VERSION < 4.08) {
24 eval 'sub CGI::multi_param { CGI::param(@_) }'
25 }
26
27 our $t0 = [ gettimeofday() ];
28 our $number_of_git_cmds = 0;
29
30 BEGIN {
31 CGI->compile() if $ENV{'MOD_PERL'};
32 }
33
34 our $version = "++GIT_VERSION++";
35
36 our ($my_url, $my_uri, $base_url, $path_info, $home_link);
# Compute the URLs gitweb uses to refer to itself and store them in the
# package globals $my_url, $my_uri, $base_url, $path_info and $home_link.
# Reads the global $cgi object and the PATH_INFO / SCRIPT_NAME environment.
sub evaluate_uri {
	our $cgi;

	# Full URL and absolute path of the script, as reported by CGI.
	our $my_url = $cgi->url();
	our $my_uri = $cgi->url(-absolute => 1);

	# Base for relative URLs ($logo, $favicon, ...); it is only needed
	# for requests that carry a non-empty PATH_INFO.
	our $base_url = $my_url;

	# When gitweb is the DirectoryIndex, the URL lacks the script name and
	# $cgi->url() does not strip PATH_INFO, so it is stripped here.
	# $path_info is a global because later code uses it as well.
	#
	# In that setup $my_url is not the full script URL.  That is wanted
	# for generated links (they keep implying the script name), but it
	# makes $my_url unusable as a base URL; so whenever PATH_INFO had to
	# be stripped, the base URL is rebuilt from SCRIPT_NAME.
	our $path_info = decode_utf8($ENV{"PATH_INFO"});
	if ($path_info) {
		# The web server has already URL-decoded PATH_INFO, while
		# $my_url and $my_uri are still encoded: decode them so the
		# PATH_INFO suffix can be matched.
		$my_url = unescape($my_url);
		$my_uri = unescape($my_uri);

		# Each step runs only if the previous one succeeded.
		if ($my_url =~ s,\Q$path_info\E$,,) {
			if ($my_uri =~ s,\Q$path_info\E$,,) {
				if (defined $ENV{'SCRIPT_NAME'}) {
					$base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
				}
			}
		}
	}

	# Target of the home link shown at the top of every page.
	our $home_link = $my_uri || "/";
}
76
77 # core git executable to use
78 # this can just be "git" if your webserver has a sensible PATH
79 our $GIT = "++GIT_BINDIR++/git";
80
81 # absolute fs-path which will be prepended to the project path
82 #our $projectroot = "/pub/scm";
83 our $projectroot = "++GITWEB_PROJECTROOT++";
84
85 # fs traversing limit for getting project list
86 # the number is relative to the projectroot
87 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
88
89 # string of the home link on top of all pages
90 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
91
92 # extra breadcrumbs preceding the home link
93 our @extra_breadcrumbs = ();
94
95 # name of your site or organization to appear in page titles
96 # replace this with something more descriptive for clearer bookmarks
97 our $site_name = "++GITWEB_SITENAME++"
98 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
99
100 # html snippet to include in the <head> section of each page
101 our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
102 # filename of html text to include at top of each page
103 our $site_header = "++GITWEB_SITE_HEADER++";
104 # html text to include at home page
105 our $home_text = "++GITWEB_HOMETEXT++";
106 # filename of html text to include at bottom of each page
107 our $site_footer = "++GITWEB_SITE_FOOTER++";
108
109 # URI of stylesheets
110 our @stylesheets = ("++GITWEB_CSS++");
111 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
112 our $stylesheet = undef;
113 # URI of GIT logo (72x27 size)
114 our $logo = "++GITWEB_LOGO++";
115 # URI of GIT favicon, assumed to be image/png type
116 our $favicon = "++GITWEB_FAVICON++";
117 # URI of gitweb.js (JavaScript code for gitweb)
118 our $javascript = "++GITWEB_JS++";
119
120 # URI and label (title) of GIT logo link
121 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
122 #our $logo_label = "git documentation";
123 our $logo_url = "http://git-scm.com/";
124 our $logo_label = "git homepage";
125
126 # source of projects list
127 our $projects_list = "++GITWEB_LIST++";
128
129 # the width (in characters) of the projects list "Description" column
130 our $projects_list_description_width = 25;
131
132 # group projects by category on the projects list
133 # (enabled if this variable evaluates to true)
134 our $projects_list_group_categories = 0;
135
136 # default category if none specified
137 # (leave the empty string for no category)
138 our $project_list_default_category = "";
139
140 # default order of projects list
141 # valid values are none, project, descr, owner, and age
142 our $default_projects_order = "project";
143
144 # show repository only if this file exists
145 # (only effective if this variable evaluates to true)
146 our $export_ok = "++GITWEB_EXPORT_OK++";
147
148 # don't generate age column on the projects list page
149 our $omit_age_column = 0;
150
151 # don't generate information about owners of repositories
152 our $omit_owner=0;
153
154 # show repository only if this subroutine returns true
155 # when given the path to the project, for example:
156 # sub { return -e "$_[0]/git-daemon-export-ok"; }
157 our $export_auth_hook = undef;
158
159 # only allow viewing of repositories also shown on the overview page
160 our $strict_export = "++GITWEB_STRICT_EXPORT++";
161
162 # list of git base URLs used for URL to where fetch project from,
163 # i.e. full URL is "$git_base_url/$project"
164 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
165
166 # default blob_plain mimetype and default charset for text/plain blob
167 our $default_blob_plain_mimetype = 'text/plain';
168 our $default_text_plain_charset = undef;
169
170 # file to use for guessing MIME types before trying /etc/mime.types
171 # (relative to the current git repository)
172 our $mimetypes_file = undef;
173
174 # assume this charset if line contains non-UTF-8 characters;
175 # it should be a valid encoding (see Encode::Supported(3pm) for a list),
176 # for which encoding all byte sequences are valid, for example
177 # 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
178 # could be even 'utf-8' for the old behavior)
179 our $fallback_encoding = 'latin1';
180
181 # rename detection options for git-diff and git-diff-tree
182 # - default is '-M', with the cost proportional to
183 # (number of removed files) * (number of new files).
184 # - more costly is '-C' (which implies '-M'), with the cost proportional to
185 # (number of changed files + number of removed files) * (number of new files)
186 # - even more costly is '-C', '--find-copies-harder' with cost
187 # (number of files in the original tree) * (number of new files)
188 # - one might want to include '-B' option, e.g. '-B', '-M'
189 our @diff_opts = ('-M'); # taken from git_commit
190
191 # Disables features that would allow repository owners to inject script into
192 # the gitweb domain.
193 our $prevent_xss = 0;
194
195 # Path to the highlight executable to use (must be the one from
196 # http://www.andre-simon.de due to assumptions about parameters and output).
197 # Useful if highlight is not installed on your webserver's PATH.
198 # [Default: highlight]
199 our $highlight_bin = "++HIGHLIGHT_BIN++";
200
201 # information about snapshot formats that gitweb is capable of serving
202 our %known_snapshot_formats = (
203 # name => {
204 # 'display' => display name,
205 # 'type' => mime type,
206 # 'suffix' => filename suffix,
207 # 'format' => --format for git-archive,
208 # 'compressor' => [compressor command and arguments]
209 # (array reference, optional)
210 # 'disabled' => boolean (optional)}
211 #
212 'tgz' => {
213 'display' => 'tar.gz',
214 'type' => 'application/x-gzip',
215 'suffix' => '.tar.gz',
216 'format' => 'tar',
217 'compressor' => ['gzip', '-n']},
218
219 'tbz2' => {
220 'display' => 'tar.bz2',
221 'type' => 'application/x-bzip2',
222 'suffix' => '.tar.bz2',
223 'format' => 'tar',
224 'compressor' => ['bzip2']},
225
226 'txz' => {
227 'display' => 'tar.xz',
228 'type' => 'application/x-xz',
229 'suffix' => '.tar.xz',
230 'format' => 'tar',
231 'compressor' => ['xz'],
232 'disabled' => 1},
233
234 'zip' => {
235 'display' => 'zip',
236 'type' => 'application/x-zip',
237 'suffix' => '.zip',
238 'format' => 'zip'},
239 );
240
241 # Aliases so we understand old gitweb.snapshot values in repository
242 # configuration.
243 our %known_snapshot_format_aliases = (
244 'gzip' => 'tgz',
245 'bzip2' => 'tbz2',
246 'xz' => 'txz',
247
248 # backward compatibility: legacy gitweb config support
249 'x-gzip' => undef, 'gz' => undef,
250 'x-bzip2' => undef, 'bz2' => undef,
251 'x-zip' => undef, '' => undef,
252 );
253
254 # Pixel sizes for icons and avatars. If the default font sizes or lineheights
255 # are changed, it may be appropriate to change these values too via
256 # $GITWEB_CONFIG.
257 our %avatar_size = (
258 'default' => 16,
259 'double' => 32
260 );
261
262 # Used to set the maximum load that we will still respond to gitweb queries.
263 # If server load exceeds this value then return "503 server busy" error.
264 # If gitweb cannot determine server load, it is taken to be 0.
265 # Leave it undefined (or set to 'undef') to turn off load checking.
266 our $maxload = 300;
267
268 # configuration for 'highlight' (http://www.andre-simon.de/)
269 # match by basename
270 our %highlight_basename = (
271 #'Program' => 'py',
272 #'Library' => 'py',
273 'SConstruct' => 'py', # SCons equivalent of Makefile
274 'Makefile' => 'make',
275 );
276 # match by extension
277 our %highlight_ext = (
278 # main extensions, defining name of syntax;
279 # see files in /usr/share/highlight/langDefs/ directory
280 (map { $_ => $_ } qw(py rb java css js tex bib xml awk bat ini spec tcl sql)),
281 # alternate extensions, see /etc/highlight/filetypes.conf
282 (map { $_ => 'c' } qw(c h)),
283 (map { $_ => 'sh' } qw(sh bash zsh ksh)),
284 (map { $_ => 'cpp' } qw(cpp cxx c++ cc)),
285 (map { $_ => 'php' } qw(php php3 php4 php5 phps)),
286 (map { $_ => 'pl' } qw(pl perl pm)), # perhaps also 'cgi'
287 (map { $_ => 'make'} qw(make mak mk)),
288 (map { $_ => 'xml' } qw(xml xhtml html htm)),
289 );
290
291 # You define site-wide feature defaults here; override them with
292 # $GITWEB_CONFIG as necessary.
293 our %feature = (
294 # feature => {
295 # 'sub' => feature-sub (subroutine),
296 # 'override' => allow-override (boolean),
297 # 'default' => [ default options...] (array reference)}
298 #
299 # if feature is overridable (it means that allow-override has true value),
300 # then feature-sub will be called with default options as parameters;
301 # return value of feature-sub indicates if to enable specified feature
302 #
303 # if there is no 'sub' key (no feature-sub), then feature cannot be
304 # overridden
305 #
306 # use gitweb_get_feature(<feature>) to retrieve the <feature> value
307 # (an array) or gitweb_check_feature(<feature>) to check if <feature>
308 # is enabled
309
310 # Enable the 'blame' blob view, showing the last commit that modified
311 # each line in the file. This can be very CPU-intensive.
312
313 # To enable system wide have in $GITWEB_CONFIG
314 # $feature{'blame'}{'default'} = [1];
315 # To have project specific config enable override in $GITWEB_CONFIG
316 # $feature{'blame'}{'override'} = 1;
317 # and in project config gitweb.blame = 0|1;
318 'blame' => {
319 'sub' => sub { feature_bool('blame', @_) },
320 'override' => 0,
321 'default' => [0]},
322
323 # Enable the 'snapshot' link, providing a compressed archive of any
324 # tree. This can potentially generate high traffic if you have large
325 # project.
326
327 # Value is a list of formats defined in %known_snapshot_formats that
328 # you wish to offer.
329 # To disable system wide have in $GITWEB_CONFIG
330 # $feature{'snapshot'}{'default'} = [];
331 # To have project specific config enable override in $GITWEB_CONFIG
332 # $feature{'snapshot'}{'override'} = 1;
333 # and in project config, a comma-separated list of formats or "none"
334 # to disable. Example: gitweb.snapshot = tbz2,zip;
335 'snapshot' => {
336 'sub' => \&feature_snapshot,
337 'override' => 0,
338 'default' => ['tgz']},
339
340 # Enable text search, which will list the commits which match author,
341 # committer or commit text to a given string. Enabled by default.
342 # Project specific override is not supported.
343 #
344 # Note that this controls all search features, which means that if
345 # it is disabled, then 'grep' and 'pickaxe' search would also be
346 # disabled.
347 'search' => {
348 'override' => 0,
349 'default' => [1]},
350
351 # Enable grep search, which will list the files in currently selected
352 # tree containing the given string. Enabled by default. This can be
353 # potentially CPU-intensive, of course.
354 # Note that you need to have 'search' feature enabled too.
355
356 # To enable system wide have in $GITWEB_CONFIG
357 # $feature{'grep'}{'default'} = [1];
358 # To have project specific config enable override in $GITWEB_CONFIG
359 # $feature{'grep'}{'override'} = 1;
360 # and in project config gitweb.grep = 0|1;
361 'grep' => {
362 'sub' => sub { feature_bool('grep', @_) },
363 'override' => 0,
364 'default' => [1]},
365
366 # Enable the pickaxe search, which will list the commits that modified
367 # a given string in a file. This can be a practical and much faster
368 # alternative to 'blame', but still potentially CPU-intensive.
369 # Note that you need to have 'search' feature enabled too.
370
371 # To enable system wide have in $GITWEB_CONFIG
372 # $feature{'pickaxe'}{'default'} = [1];
373 # To have project specific config enable override in $GITWEB_CONFIG
374 # $feature{'pickaxe'}{'override'} = 1;
375 # and in project config gitweb.pickaxe = 0|1;
376 'pickaxe' => {
377 'sub' => sub { feature_bool('pickaxe', @_) },
378 'override' => 0,
379 'default' => [1]},
380
381 # Enable showing size of blobs in a 'tree' view, in a separate
382 # column, similar to what 'ls -l' does. This cost a bit of IO.
383
384 # To disable system wide have in $GITWEB_CONFIG
385 # $feature{'show-sizes'}{'default'} = [0];
386 # To have project specific config enable override in $GITWEB_CONFIG
387 # $feature{'show-sizes'}{'override'} = 1;
388 # and in project config gitweb.showsizes = 0|1;
389 'show-sizes' => {
390 'sub' => sub { feature_bool('showsizes', @_) },
391 'override' => 0,
392 'default' => [1]},
393
394 # Make gitweb use an alternative format of the URLs which can be
395 # more readable and natural-looking: project name is embedded
396 # directly in the path and the query string contains other
397 # auxiliary information. All gitweb installations recognize
398 # URL in either format; this configures in which formats gitweb
399 # generates links.
400
401 # To enable system wide have in $GITWEB_CONFIG
402 # $feature{'pathinfo'}{'default'} = [1];
403 # Project specific override is not supported.
404
405 # Note that you will need to change the default location of CSS,
406 # favicon, logo and possibly other files to an absolute URL. Also,
407 # if gitweb.cgi serves as your indexfile, you will need to force
408 # $my_uri to contain the script name in your $GITWEB_CONFIG.
409 'pathinfo' => {
410 'override' => 0,
411 'default' => [0]},
412
413 # Make gitweb consider projects in project root subdirectories
414 # to be forks of existing projects. Given project $projname.git,
415 # projects matching $projname/*.git will not be shown in the main
416 # projects list, instead a '+' mark will be added to $projname
417 # there and a 'forks' view will be enabled for the project, listing
418 # all the forks. If project list is taken from a file, forks have
419 # to be listed after the main project.
420
421 # To enable system wide have in $GITWEB_CONFIG
422 # $feature{'forks'}{'default'} = [1];
423 # Project specific override is not supported.
424 'forks' => {
425 'override' => 0,
426 'default' => [0]},
427
428 # Insert custom links to the action bar of all project pages.
429 # This enables you mainly to link to third-party scripts integrating
430 # into gitweb; e.g. git-browser for graphical history representation
431 # or custom web-based repository administration interface.
432
433 # The 'default' value consists of a list of triplets in the form
434 # (label, link, position) where position is the label after which
435 # to insert the link and link is a format string where %n expands
436 # to the project name, %f to the project path within the filesystem,
437 # %h to the current hash (h gitweb parameter) and %b to the current
438 # hash base (hb gitweb parameter); %% expands to %.
439
440 # To enable system wide have in $GITWEB_CONFIG e.g.
441 # $feature{'actions'}{'default'} = [('graphiclog',
442 # '/git-browser/by-commit.html?r=%n', 'summary')];
443 # Project specific override is not supported.
444 'actions' => {
445 'override' => 0,
446 'default' => []},
447
448 # Allow gitweb scan project content tags of project repository,
449 # and display the popular Web 2.0-ish "tag cloud" near the projects
450 # list. Note that this is something COMPLETELY different from the
451 # normal Git tags.
452
453 # gitweb by itself can show existing tags, but it does not handle
454 # tagging itself; you need to do it externally, outside gitweb.
455 # The format is described in git_get_project_ctags() subroutine.
456 # You may want to install the HTML::TagCloud Perl module to get
457 # a pretty tag cloud instead of just a list of tags.
458
459 # To enable system wide have in $GITWEB_CONFIG
460 # $feature{'ctags'}{'default'} = [1];
461 # Project specific override is not supported.
462
463 # In the future whether ctags editing is enabled might depend
464 # on the value, but using 1 should always mean no editing of ctags.
465 'ctags' => {
466 'override' => 0,
467 'default' => [0]},
468
469 # The maximum number of patches in a patchset generated in patch
470 # view. Set this to 0 or undef to disable patch view, or to a
471 # negative number to remove any limit.
472
473 # To disable system wide have in $GITWEB_CONFIG
474 # $feature{'patches'}{'default'} = [0];
475 # To have project specific config enable override in $GITWEB_CONFIG
476 # $feature{'patches'}{'override'} = 1;
477 # and in project config gitweb.patches = 0|n;
478 # where n is the maximum number of patches allowed in a patchset.
479 'patches' => {
480 'sub' => \&feature_patches,
481 'override' => 0,
482 'default' => [16]},
483
484 # Avatar support. When this feature is enabled, views such as
485 # shortlog or commit will display an avatar associated with
486 # the email of the committer(s) and/or author(s).
487
488 # Currently available providers are gravatar and picon.
489 # If an unknown provider is specified, the feature is disabled.
490
491 # Gravatar depends on Digest::MD5.
492 # Picon currently relies on the indiana.edu database.
493
494 # To enable system wide have in $GITWEB_CONFIG
495 # $feature{'avatar'}{'default'} = ['<provider>'];
496 # where <provider> is either gravatar or picon.
497 # To have project specific config enable override in $GITWEB_CONFIG
498 # $feature{'avatar'}{'override'} = 1;
499 # and in project config gitweb.avatar = <provider>;
500 'avatar' => {
501 'sub' => \&feature_avatar,
502 'override' => 0,
503 'default' => ['']},
504
505 # Enable displaying how much time and how many git commands
506 # it took to generate and display page. Disabled by default.
507 # Project specific override is not supported.
508 'timed' => {
509 'override' => 0,
510 'default' => [0]},
511
512 # Enable turning some links into links to actions which require
513 # JavaScript to run (like 'blame_incremental'). Not enabled by
514 # default. Project specific override is currently not supported.
515 'javascript-actions' => {
516 'override' => 0,
517 'default' => [0]},
518
519 # Enable and configure ability to change common timezone for dates
520 # in gitweb output via JavaScript. Enabled by default.
521 # Project specific override is not supported.
522 'javascript-timezone' => {
523 'override' => 0,
524 'default' => [
525 'local', # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
526 # or undef to turn off this feature
527 'gitweb_tz', # name of cookie where to store selected timezone
528 'datetime', # CSS class used to mark up dates for manipulation
529 ]},
530
531 # Syntax highlighting support. This is based on Daniel Svensson's
532 # and Sham Chukoury's work in gitweb-xmms2.git.
533 # It requires the 'highlight' program present in $PATH,
534 # and therefore is disabled by default.
535
536 # To enable system wide have in $GITWEB_CONFIG
537 # $feature{'highlight'}{'default'} = [1];
538
539 'highlight' => {
540 'sub' => sub { feature_bool('highlight', @_) },
541 'override' => 0,
542 'default' => [0]},
543
544 # Enable displaying of remote heads in the heads list
545
546 # To enable system wide have in $GITWEB_CONFIG
547 # $feature{'remote_heads'}{'default'} = [1];
548 # To have project specific config enable override in $GITWEB_CONFIG
549 # $feature{'remote_heads'}{'override'} = 1;
550 # and in project config gitweb.remoteheads = 0|1;
551 'remote_heads' => {
552 'sub' => sub { feature_bool('remote_heads', @_) },
553 'override' => 0,
554 'default' => [0]},
555
556 # Enable showing branches under other refs in addition to heads
557
558 # To set system wide extra branch refs have in $GITWEB_CONFIG
559 # $feature{'extra-branch-refs'}{'default'} = ['dirs', 'of', 'choice'];
560 # To have project specific config enable override in $GITWEB_CONFIG
561 # $feature{'extra-branch-refs'}{'override'} = 1;
562 # and in project config gitweb.extrabranchrefs = dirs of choice
563 # Every directory is separated with whitespace.
564
565 'extra-branch-refs' => {
566 'sub' => \&feature_extra_branch_refs,
567 'override' => 0,
568 'default' => []},
569 );
570
# Return the list of values for feature $name, or nothing at all if the
# feature is not present in %feature.
#
# The site-wide defaults are returned unless the feature is marked as
# overridable and a project is selected ($git_dir is defined); in that
# case the feature's 'sub' is called with the defaults and its result is
# returned.  An overridable feature without a 'sub' triggers a warning
# and falls back to the defaults.
sub gitweb_get_feature {
	my ($name) = @_;
	return unless exists $feature{$name};

	my $spec        = $feature{$name};
	my $feature_sub = $spec->{'sub'};
	my $overridable = $spec->{'override'};
	my @defaults    = @{$spec->{'default'}};

	# project specific override is possible only if we have project
	our $git_dir; # global variable, declared later
	if ($overridable && defined $git_dir) {
		return $feature_sub->(@defaults) if defined $feature_sub;
		warn "feature $name is not overridable";
	}

	return @defaults;
}
589
# Convenience wrapper returning only the first value of a feature, which
# is what is needed to test whether a feature is enabled.  It lets you write
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# rather than
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
	my @feature_args = @_;
	return (gitweb_get_feature(@feature_args))[0];
}
604
605
# Resolve a boolean feature from the per-project configuration.
#
#   $key    - name of the project config key, queried with '--bool'
#   $_[0]   - site-wide default, used when the project does not set the key
#
# Returns a one-element list: the default if the key is unset, 1 for
# 'true', and 0 otherwise.
sub feature_bool {
	my $key = shift;
	my ($val) = git_get_project_config($key, '--bool');

	return ($_[0]) unless defined $val;
	return (1) if $val eq 'true';

	# 'false' disables the feature.  Any other value is treated the same
	# way; it used to fall off the end of the if/elsif chain, leaving the
	# result to Perl's implicit return value (which happened to be false).
	return (0);
}
618
# Pick the snapshot formats to offer for the current project.
# Arguments are the site-wide default formats.  A true 'snapshot' project
# config value replaces them: 'none' means no formats, anything else is a
# list of formats separated by commas and/or whitespace.
sub feature_snapshot {
	my (@formats) = @_;

	my ($configured) = git_get_project_config('snapshot');

	unless ($configured) {
		return @formats;
	}

	my @chosen = ();
	if ($configured ne 'none') {
		@chosen = split /\s*[,\s]\s*/, $configured;
	}
	return @chosen;
}
630
# Maximum number of patches in a patchset for the current project:
# whatever the 'patches' project config (queried with '--int') yields,
# or the first site-wide default when the project config yields nothing.
sub feature_patches {
	my @configured = (git_get_project_config('patches', '--int'));

	return @configured ? @configured : ($_[0]);
}
640
# Avatar provider for the current project: the 'avatar' project config
# value(s) if there are any, otherwise the site-wide defaults passed in.
sub feature_avatar {
	my @configured = (git_get_project_config('avatar'));

	if (@configured) {
		return @configured;
	}
	return @_;
}
646
# Extra ref directories to be shown as branches for the current project.
# Arguments are the site-wide defaults.  A true 'extrabranchrefs' project
# config value replaces them: each configured entry is split on
# whitespace and all resulting names are returned.
sub feature_extra_branch_refs {
	my (@branch_refs) = @_;
	my $configured = git_get_project_config('extrabranchrefs');

	return @branch_refs unless $configured;

	my $entries = config_to_multi($configured);
	my @from_config = map { split /\s+/, $_ } @{$entries};

	return @from_config;
}
661
# Tell whether directory $dir has a usable HEAD.
#
# A plain -e test on HEAD is not enough: in a repository initialized long
# ago HEAD may be a symlink, and after pack-refs and pruning its target
# may no longer exist.  A symlink whose target starts with refs/heads/ is
# therefore accepted as well.
sub check_head_link {
	my ($dir) = @_;
	my $head_path = "$dir/HEAD";

	return 1 if -e $head_path;
	return (-l $head_path && readlink($head_path) =~ /^refs\/heads\//);
}
671
# Decide whether the repository in $dir may be exported.  All of these
# must hold:
#  - check_head_link() accepts the directory,
#  - $export_ok is false, or the file "$dir/$export_ok" exists,
#  - $export_auth_hook is false, or the hook returns true for $dir.
# Returns the first false result, or the result of the last check.
sub check_export_ok {
	my ($dir) = @_;

	my $has_head = check_head_link($dir);
	return $has_head unless $has_head;

	my $marker_ok = (!$export_ok || -e "$dir/$export_ok");
	return $marker_ok unless $marker_ok;

	return (!$export_auth_hook || $export_auth_hook->($dir));
}
678
679 # process alternate names for backward compatibility
680 # filter out unsupported (unknown) snapshot formats
# Normalize a list of snapshot format names.
#
# Names found in %known_snapshot_format_aliases are replaced by the value
# they map to; the result is then limited to formats present in
# %known_snapshot_formats and not marked 'disabled'.
#
# Some legacy aliases map to undef.  Those entries are dropped by an
# explicit defined() test, so an undefined value is never used as a hash
# key (which would emit an "uninitialized value" warning).
sub filter_snapshot_fmts {
	my @fmts = @_;

	@fmts = map {
		defined $_ && exists $known_snapshot_format_aliases{$_} ?
		       $known_snapshot_format_aliases{$_} : $_} @fmts;
	@fmts = grep {
		defined $_ &&
		exists $known_snapshot_formats{$_} &&
		!$known_snapshot_formats{$_}{'disabled'}} @fmts;

	return @fmts;
}
691
# Validate the refs given for the 'extra-branch-refs' feature and return
# them sorted, without duplicates and without 'heads'.
# Calls die_error(500, ...) for a ref rejected by is_valid_ref_format().
sub filter_and_validate_refs {
	my %seen = ();

	foreach my $ref (@_) {
		is_valid_ref_format($ref)
			or die_error(500, "Invalid ref '$ref' in 'extra-branch-refs' feature");
		# 'heads' are added implicitly in get_branch_refs().
		next if $ref eq 'heads';
		$seen{$ref} = 1;
	}

	return sort keys %seen;
}
703
704 # If it is set to code reference, it is code that it is to be run once per
705 # request, allowing updating configurations that change with each request,
706 # while running other code in config file only once.
707 #
708 # Otherwise, if it is false then gitweb would process config file only once;
709 # if it is true then gitweb config would be run for each request.
710 our $per_request_config = 1;
711
# Read and evaluate the gitweb config file named by the first argument.
#
# Returns true if the file exists and was evaluated, and false (empty
# list / undef) if no name was given or the file does not exist, so calls
# can be chained to use the first config file that exists.
# Dies with the parser's message if the file fails to compile or dies
# while running, because such an error is unrecoverable.
sub read_config_file {
	my $filename = shift;
	return unless defined $filename;

	if (-e $filename) {
		# "do FILE" looks a relative name up in @INC rather than in the
		# current directory, so it may load a different file than the
		# one just tested with -e, or (since '.' is no longer in @INC)
		# load nothing at all.  Pass an absolute path so that exactly
		# the tested file is evaluated.
		require File::Spec;
		my $config_path = File::Spec->rel2abs($filename);

		do $config_path;
		# die if there are errors parsing config file
		die $@ if $@;
		return 1;
	}
	return;
}
727
728 our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
# Determine the config file names (environment first, build-time value
# otherwise), store them in the package globals and read the files:
# the common one always, then the first existing one of the per-instance
# and the system-wide config.
sub evaluate_gitweb_config {
	our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
	our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
	our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";

	# Never read the same file twice: blank out a name that duplicates
	# the common config.  Only one of $GITWEB_CONFIG and
	# $GITWEB_CONFIG_SYSTEM ends up being used, so a duplicate between
	# those two is harmless.
	foreach my $candidate ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM) {
		$candidate = "" if ($candidate eq $GITWEB_CONFIG_COMMON);
	}

	# Common system-wide settings for convenience; they can be
	# overridden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
	read_config_file($GITWEB_CONFIG_COMMON);

	# Use the first config file that exists: the per-instance
	# GITWEB_CONFIG if present, otherwise GITWEB_CONFIG_SYSTEM.
	return if read_config_file($GITWEB_CONFIG);
	return read_config_file($GITWEB_CONFIG_SYSTEM);
}
749
# Return the system load average, for comparison against $maxload.
# The value is the first field of '/proc/loadavg'.  If that file does not
# exist or cannot be opened, 0 is returned, which means no load checking.
sub get_loadavg {
	my $loadavg_file = '/proc/loadavg';

	# additional checks for load average should go here for things that
	# don't export /proc/loadavg
	return 0 unless -e $loadavg_file;

	open(my $loadavg_fh, '<', $loadavg_file)
		or return 0;
	my $line = <$loadavg_fh>;
	close $loadavg_fh;

	# The first three columns measure CPU and IO utilization of the last
	# one, five, and 10 minute periods.  The fourth column shows the
	# number of currently running processes and the total number of
	# processes in the m/n format.  The last column displays the last
	# process ID used.  Only the first column is wanted.
	my ($one_minute) = split(/\s+/, $line);

	return $one_minute || 0;
}
771
772 # version of the core git binary
773 our $git_version;
sub evaluate_git_version {
	# Run "$GIT --version" and keep what follows "git version ";
	# fall back to "unknown" if the output does not look like that.
	my $version_output = qx("$GIT" --version);
	our $git_version = ($version_output =~ m/git version (.*)$/) ? $1 : "unknown";

	# This counts as one executed git command.
	$number_of_git_cmds++;
}
778
# Refuse the request with a 503 error when the load average is above
# $maxload.  Nothing is checked when $maxload is undefined.
sub check_loadavg {
	if (defined $maxload) {
		my $current_load = get_loadavg();
		if ($current_load > $maxload) {
			die_error(503, "The load average on the server is too high");
		}
	}
}
784
785 # ======================================================================
786 # input validation and dispatch
787
788 # input parameters can be collected from a variety of sources (presently, CGI
789 # and PATH_INFO), so we define an %input_params hash that collects them all
790 # together during validation: this allows subsequent uses (e.g. href()) to be
791 # agnostic of the parameter origin
792
793 our %input_params = ();
794
795 # input parameters are stored with the long parameter name as key. This will
796 # also be used in the href subroutine to convert parameters to their CGI
797 # equivalent, and since the href() usage is the most frequent one, we store
798 # the name -> CGI key mapping here, instead of the reverse.
799 #
800 # XXX: Warning: If you touch this, check the search form for updating,
801 # too.
802
803 our @cgi_param_mapping = (
804 project => "p",
805 action => "a",
806 file_name => "f",
807 file_parent => "fp",
808 hash => "h",
809 hash_parent => "hp",
810 hash_base => "hb",
811 hash_parent_base => "hpb",
812 page => "pg",
813 order => "o",
814 searchtext => "s",
815 searchtype => "st",
816 snapshot_format => "sf",
817 extra_options => "opt",
818 search_use_regexp => "sr",
819 ctag => "by_tag",
820 diff_style => "ds",
821 project_filter => "pf",
822 # this must be last entry (for manipulation from JavaScript)
823 javascript => "js"
824 );
825 our %cgi_param_mapping = @cgi_param_mapping;
826
827 # we will also need to know the possible actions, for validation
828 our %actions = (
829 "blame" => \&git_blame,
830 "blame_incremental" => \&git_blame_incremental,
831 "blame_data" => \&git_blame_data,
832 "blobdiff" => \&git_blobdiff,
833 "blobdiff_plain" => \&git_blobdiff_plain,
834 "blob" => \&git_blob,
835 "blob_plain" => \&git_blob_plain,
836 "commitdiff" => \&git_commitdiff,
837 "commitdiff_plain" => \&git_commitdiff_plain,
838 "commit" => \&git_commit,
839 "forks" => \&git_forks,
840 "heads" => \&git_heads,
841 "history" => \&git_history,
842 "log" => \&git_log,
843 "patch" => \&git_patch,
844 "patches" => \&git_patches,
845 "remotes" => \&git_remotes,
846 "rss" => \&git_rss,
847 "atom" => \&git_atom,
848 "search" => \&git_search,
849 "search_help" => \&git_search_help,
850 "shortlog" => \&git_shortlog,
851 "summary" => \&git_summary,
852 "tag" => \&git_tag,
853 "tags" => \&git_tags,
854 "tree" => \&git_tree,
855 "snapshot" => \&git_snapshot,
856 "object" => \&git_object,
857 # those below don't need $project
858 "opml" => \&git_opml,
859 "project_list" => \&git_project_list,
860 "project_index" => \&git_project_index,
861 );
862
863 # finally, we have the hash of allowed extra_options for the commands that
864 # allow them
865 our %allowed_options = (
866 "--no-merges" => [ qw(rss atom log shortlog history) ],
867 );
868
# Populate %input_params from the CGI query parameters, keyed by the long
# parameter name and decoded from UTF-8.  Every parameter is stored as a
# single value except 'opt', which may be given several times and is
# stored as an array reference.  As it is the only multi-valued parameter
# for now, it is simply special-cased instead of keeping a list of such
# parameters.
sub evaluate_query_params {
	our $cgi;

	foreach my $name (keys %cgi_param_mapping) {
		my $symbol = $cgi_param_mapping{$name};

		$input_params{$name} = ($symbol eq 'opt')
			? [ map { decode_utf8($_) } $cgi->multi_param($symbol) ]
			: decode_utf8($cgi->param($symbol));
	}
}
884
# Read PATH_INFO and fill in %input_params entries that were not already
# supplied through the query string.
#
# Recognized layout (after the leading slashes are removed):
#   $project[/$action][/[$parent_ref[:$parent_path]..]$ref[:$path]]
#
# Reads:  $path_info, $projectroot, %actions, %known_snapshot_formats
# Writes: %input_params, $path_info (the consumed prefix is stripped), and
#         the 'suffix' of the matched entry in %known_snapshot_formats
# Returns early (changing nothing more) when a project was already given,
# when PATH_INFO is empty, when no project can be found in it, or when an
# action was given in the query string.
sub evaluate_path_info {
	return if defined $input_params{'project'};
	return if !$path_info;
	$path_info =~ s,^/+,,;
	return if !$path_info;

	# find which part of PATH_INFO is project: strip trailing path
	# components until what is left passes check_head_link()
	my $project = $path_info;
	$project =~ s,/+$,,;
	while ($project && !check_head_link("$projectroot/$project")) {
		$project =~ s,/*[^/]*$,,;
	}
	return unless $project;
	$input_params{'project'} = $project;

	# do not change any parameters if an action is given using the query string
	return if $input_params{'action'};
	$path_info =~ s,^\Q$project\E/*,,;

	# next, check if we have an action
	my $action = $path_info;
	$action =~ s,/.*$,,;
	if (exists $actions{$action}) {
		# quote the action so it is always matched literally
		$path_info =~ s,^\Q$action\E/*,,;
		$input_params{'action'} = $action;
	}

	# list of actions that want hash_base instead of hash, but can have no
	# pathname (f) parameter
	my @wants_base = (
		'tree',
		'history',
	);

	# we want to catch, among others
	# [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
	my ($parentrefname, $parentpathname, $refname, $pathname) =
		($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

	# first, analyze the 'current' part
	if (defined $pathname) {
		# we got "branch:filename" or "branch:dir/"
		# we could use git_get_type(branch:pathname), but:
		# - it needs $git_dir
		# - it does a git() call
		# - the convention of terminating directories with a slash
		#   makes it superfluous
		# - embedding the action in the PATH_INFO would make it even
		#   more superfluous
		$pathname =~ s,^/+,,;
		if (!$pathname || substr($pathname, -1) eq "/") {
			$input_params{'action'} ||= "tree";
			$pathname =~ s,/$,,;
		} else {
			# the default action depends on whether we had parent info
			# or not
			if ($parentrefname) {
				$input_params{'action'} ||= "blobdiff_plain";
			} else {
				$input_params{'action'} ||= "blob_plain";
			}
		}
		$input_params{'hash_base'} ||= $refname;
		$input_params{'file_name'} ||= $pathname;
	} elsif (defined $refname) {
		# we got "branch". In this case we have to choose if we have to
		# set hash or hash_base.
		#
		# Most of the actions without a pathname only want hash to be
		# set, except for the ones specified in @wants_base that want
		# hash_base instead. It should also be noted that hand-crafted
		# links having 'history' as an action and no pathname or hash
		# set will fail, but that happens regardless of PATH_INFO.
		if (defined $parentrefname) {
			# if there is parent let the default be 'shortlog' action
			# (for http://git.example.com/repo.git/A..B links); if there
			# is no parent, dispatch will detect type of object and set
			# action appropriately if required (if action is not set)
			$input_params{'action'} ||= "shortlog";
		}
		if ($input_params{'action'} &&
		    grep { $_ eq $input_params{'action'} } @wants_base) {
			$input_params{'hash_base'} ||= $refname;
		} else {
			$input_params{'hash'} ||= $refname;
		}
	}

	# next, handle the 'parent' part, if present
	if (defined $parentrefname) {
		# a missing pathspec defaults to the 'current' filename, allowing e.g.
		# someproject/blobdiff/oldrev..newrev:/filename
		if ($parentpathname) {
			$parentpathname =~ s,^/+,,;
			$parentpathname =~ s,/$,,;
			$input_params{'file_parent'} ||= $parentpathname;
		} else {
			$input_params{'file_parent'} ||= $input_params{'file_name'};
		}
		# we assume that hash_parent_base is wanted if a path was specified,
		# or if the action wants hash_base instead of hash.
		# The action can still be undefined here (e.g. PATH_INFO "A.."),
		# so guard the comparison to avoid an uninitialized-value warning.
		if (defined $input_params{'file_parent'} ||
		    (defined $input_params{'action'} &&
		     grep { $_ eq $input_params{'action'} } @wants_base)) {
			$input_params{'hash_parent_base'} ||= $parentrefname;
		} else {
			$input_params{'hash_parent'} ||= $parentrefname;
		}
	}

	# for the snapshot action, we allow URLs in the form
	# $project/snapshot/$hash.ext
	# where .ext determines the snapshot and gets removed from the
	# passed $refname to provide the $hash.
	#
	# To be able to tell that $refname includes the format extension, we
	# require the following two conditions to be satisfied:
	# - the hash input parameter MUST have been set from the $refname part
	#   of the URL (i.e. they must be equal)
	# - the snapshot format MUST NOT have been defined already (e.g. from
	#   CGI parameter sf)
	# It's also useless to try any matching unless $refname has a dot,
	# so we check for that too
	if (defined $input_params{'action'} &&
	    $input_params{'action'} eq 'snapshot' &&
	    defined $refname && index($refname, '.') != -1 &&
	    $refname eq $input_params{'hash'} &&
	    !defined $input_params{'snapshot_format'}) {
		# We loop over the known snapshot formats, checking for
		# extensions. Allowed extensions are both the defined suffix
		# (which includes the initial dot already) and the snapshot
		# format key itself, with a prepended dot.
		#
		# Iterate over keys() rather than each(): the loop is left
		# early with 'last', and each() would keep the hash iterator
		# positioned mid-way, so the next request served by the same
		# process would silently skip some formats.
		foreach my $fmt (keys %known_snapshot_formats) {
			my $opt = $known_snapshot_formats{$fmt};
			my $hash = $refname;
			unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
				next;
			}
			my $sfx = $1;
			# a valid suffix was found, so set the snapshot format
			# and reset the hash parameter
			$input_params{'snapshot_format'} = $fmt;
			$input_params{'hash'} = $hash;
			# we also set the format suffix to the one requested
			# in the URL: this way a request for e.g. .tgz returns
			# a .tgz instead of a .tar.gz
			$known_snapshot_formats{$fmt}{'suffix'} = $sfx;
			last;
		}
	}
}
1035
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp, $project_filter);

# Copy the request parameters from %input_params into the corresponding
# package variables, validating each one on the way. Any invalid value ends
# the request through die_error() with the status shown at each check.
# Also derives $search_regexp from $searchtext: the text itself when
# regexp search was requested (after checking that it compiles), otherwise
# the quotemeta()-escaped text.
sub evaluate_and_validate_params {
	our $action = $input_params{'action'};
	if (defined $action) {
		if (!is_valid_action($action)) {
			die_error(400, "Invalid action parameter");
		}
	}

	# parameters which are pathnames
	our $project = $input_params{'project'};
	if (defined $project) {
		if (!is_valid_project($project)) {
			# clear it first so the error page is not tied to a bad project
			undef $project;
			die_error(404, "No such project");
		}
	}

	our $project_filter = $input_params{'project_filter'};
	if (defined $project_filter) {
		if (!is_valid_pathname($project_filter)) {
			die_error(404, "Invalid project_filter parameter");
		}
	}

	our $file_name = $input_params{'file_name'};
	if (defined $file_name) {
		if (!is_valid_pathname($file_name)) {
			die_error(400, "Invalid file parameter");
		}
	}

	our $file_parent = $input_params{'file_parent'};
	if (defined $file_parent) {
		if (!is_valid_pathname($file_parent)) {
			die_error(400, "Invalid file parent parameter");
		}
	}

	# parameters which are refnames
	our $hash = $input_params{'hash'};
	if (defined $hash) {
		if (!is_valid_refname($hash)) {
			die_error(400, "Invalid hash parameter");
		}
	}

	our $hash_parent = $input_params{'hash_parent'};
	if (defined $hash_parent) {
		if (!is_valid_refname($hash_parent)) {
			die_error(400, "Invalid hash parent parameter");
		}
	}

	our $hash_base = $input_params{'hash_base'};
	if (defined $hash_base) {
		if (!is_valid_refname($hash_base)) {
			die_error(400, "Invalid hash base parameter");
		}
	}

	our @extra_options = @{$input_params{'extra_options'}};
	# @extra_options is always defined, since it can only be (currently) set from
	# CGI, and $cgi->param() returns the empty array in array context if the param
	# is not set
	foreach my $opt (@extra_options) {
		if (not exists $allowed_options{$opt}) {
			die_error(400, "Invalid option parameter");
		}
		# Compare by string equality: the action may be undefined here
		# (option given without an action), and it must never be
		# interpolated into a regexp.
		if (not (defined $action &&
		         grep { $_ eq $action } @{$allowed_options{$opt}})) {
			die_error(400, "Invalid option parameter for this action");
		}
	}

	our $hash_parent_base = $input_params{'hash_parent_base'};
	if (defined $hash_parent_base) {
		if (!is_valid_refname($hash_parent_base)) {
			die_error(400, "Invalid hash parent base parameter");
		}
	}

	# other parameters
	our $page = $input_params{'page'};
	if (defined $page) {
		if ($page =~ m/[^0-9]/) {
			die_error(400, "Invalid page parameter");
		}
	}

	our $searchtype = $input_params{'searchtype'};
	if (defined $searchtype) {
		if ($searchtype =~ m/[^a-z]/) {
			die_error(400, "Invalid searchtype parameter");
		}
	}

	our $search_use_regexp = $input_params{'search_use_regexp'};

	our $searchtext = $input_params{'searchtext'};
	our $search_regexp = undef;
	if (defined $searchtext) {
		if (length($searchtext) < 2) {
			die_error(403, "At least two characters are required for search parameter");
		}
		if ($search_use_regexp) {
			$search_regexp = $searchtext;
			# compile once inside eval to reject malformed user regexps
			if (!eval { qr/$search_regexp/; 1; }) {
				# drop the " at FILE line N" location from the message
				(my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
				die_error(400, "Invalid search regexp '$search_regexp'",
				          esc_html($error));
			}
		} else {
			$search_regexp = quotemeta $searchtext;
		}
	}
}
1154
# Location of the repository served by the current request.
our $git_dir;

# Point $git_dir at "$projectroot/$project" when a project was requested;
# when no project is set, $git_dir is left untouched.
sub evaluate_git_dir {
	if ($project) {
		our $git_dir = "$projectroot/$project";
	}
}
1160
our (@snapshot_fmts, $git_avatar, @extra_branch_refs);

# Resolve the per-request feature settings into package variables:
# @snapshot_fmts, $git_avatar and @extra_branch_refs.
sub configure_gitweb_features {
	# list of supported snapshot formats
	our @snapshot_fmts = gitweb_get_feature('snapshot');
	@snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

	# The avatar feature must name a known provider whose dependencies
	# are available: 'gravatar' needs Digest::MD5, 'picon' needs nothing.
	# Anything else resets $git_avatar to the empty string.
	our ($git_avatar) = gitweb_get_feature('avatar');
	my $gravatar_usable = $git_avatar eq 'gravatar'
		&& eval { require Digest::MD5; 1; };
	unless ($gravatar_usable || $git_avatar eq 'picon') {
		$git_avatar = '';
	}

	our @extra_branch_refs = gitweb_get_feature('extra-branch-refs');
	@extra_branch_refs = filter_and_validate_refs (@extra_branch_refs);
}
1183
# Ref namespaces treated as branches: 'heads' first, followed by the
# configured @extra_branch_refs.
sub get_branch_refs {
	return ('heads', @extra_branch_refs);
}
1187
# Custom CGI::Carp error handler: turns a plain 'die <message>' into an
# Internal Server Error page rendered by die_error().
# $msg arrives already HTML-escaped.
sub handle_errors_html {
	my ($msg) = @_;

	# Swap in a plain-text handler first: if die_error itself fails we
	# must not re-enter handle_errors_html and loop forever.
	set_message("Error occurred when inside die_error:\n$msg");

	# The handler set via CGI::Carp::set_message runs _after_ the HTTP
	# headers were written, so die_error must not emit them again, and it
	# cannot jump out of the request when used as an error handler.
	die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1202
# Choose the action for this request (when none was given explicitly) and
# invoke its handler from %actions.
#
# Default action: the type of $hash, else the type of
# "$hash_base:$file_name", else 'summary' when a project is set, else
# 'project_list'. Unknown actions and project-requiring actions without a
# project end the request with a 400 error.
sub dispatch {
	unless (defined $action) {
		if (defined $hash) {
			$action = git_get_type($hash)
				or die_error(404, "Object does not exist");
		} elsif (defined $hash_base && defined $file_name) {
			$action = git_get_type("$hash_base:$file_name")
				or die_error(404, "File or directory does not exist");
		} else {
			$action = defined $project ? 'summary' : 'project_list';
		}
	}

	defined($actions{$action})
		or die_error(400, "Unknown action");

	# every action except the project-listing ones needs a project
	if (!$project &&
	    $action !~ m/^(?:opml|project_list|project_index)$/) {
		die_error(400, "Project needed");
	}

	$actions{$action}->();
}
1227
# Restart the per-request statistics: take a fresh start timestamp (only
# when timing is in use, i.e. $t0 is defined) and zero the git command
# counter.
sub reset_timer {
	our ($t0, $number_of_git_cmds);

	if (defined $t0) {
		$t0 = [ gettimeofday() ];
	}
	$number_of_git_cmds = 0;
}
1233
# True until the first request handled by this process has completed.
our $first_request = 1;

# Serve one request: (re)load configuration as needed, collect and
# validate the parameters, configure features, then dispatch the action.
sub run_request {
	reset_timer();

	evaluate_uri();

	# configuration and git version are always evaluated on first request
	if ($first_request) {
		evaluate_gitweb_config();
		evaluate_git_version();
	}

	# $per_request_config is either a code ref to run on every request,
	# or a true value asking to re-read the config on later requests
	if (ref($per_request_config) eq 'CODE') {
		$per_request_config->();
	} elsif ($per_request_config && !$first_request) {
		evaluate_gitweb_config();
	}
	check_loadavg();

	# $projectroot and $projects_list might be set in gitweb config file
	$projects_list = $projectroot unless $projects_list;

	evaluate_query_params();
	evaluate_path_info();
	evaluate_and_validate_params();
	evaluate_git_dir();

	configure_gitweb_features();

	dispatch();
}
1264
# Request-loop state. By default (plain CGI) every request is the last one.
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch the request loop to FastCGI: load CGI::Fast, use it as the request
# class, and make $is_last_request report true once this process has
# served its quota of requests.
sub configure_as_fcgi {
	require CGI::Fast;
	our $CGI = 'CGI::Fast';

	my $request_number = 0;
	# let each child service 100 requests; the check runs after a request
	# has been served, so '>=' stops after exactly the 100th one
	our $is_last_request = sub { ++$request_number >= 100 };
}
# Decide how to run from the script name and command line:
# - a script name ending in .fcgi selects FastCGI mode;
# - --fastcgi / --fcgi / -f selects FastCGI mode;
# - --nproc=N / -n N installs FCGI::ProcManager hooks managing N
#   processes (silently ignored when that module cannot be loaded).
sub evaluate_argv {
	my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
	if ($script_name =~ /\.fcgi$/) {
		configure_as_fcgi();
	}

	return if !@ARGV;

	# handler for the --nproc option
	my $setup_proc_manager = sub {
		my ($arg, $val) = @_;
		eval { require FCGI::ProcManager; 1; }
			or return;
		my $proc_manager = FCGI::ProcManager->new({
			n_processes => $val,
		});
		our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
		our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
		our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
	};

	require Getopt::Long;
	Getopt::Long::GetOptions(
		'fastcgi|fcgi|f' => \&configure_as_fcgi,
		'nproc|n=i'      => $setup_proc_manager,
	);
}
1299
# Main loop: accept requests through the configured $CGI class and serve
# each with run_request(), calling the optional hooks around it, until
# $is_last_request reports that this process is done.
sub run {
	evaluate_argv();

	$first_request = 1;
	if ($pre_listen_hook) {
		$pre_listen_hook->();
	}

 REQUEST:
	while ($cgi = $CGI->new()) {
		if ($pre_dispatch_hook) {
			$pre_dispatch_hook->();
		}

		run_request();

		if ($post_dispatch_hook) {
			$post_dispatch_hook->();
		}
		$first_request = 0;

		last REQUEST if ($is_last_request->());
	}

	# label kept as the last statement of run()
 DONE_GITWEB:
	1;
}
1324
run();

# When wrapped in a subroutine processing requests (e.g. mod_perl with
# ModPerl::Registry, or PSGI with Plack::App::WrapCGI) hand control back
# to the wrapper; as a pure CGI script serving a single request, exit.
return if defined caller;
exit;
1335
1336 ## ======================================================================
1337 ## action links
1338
# Build a gitweb URL from named parameters (the keys of
# %cgi_param_mapping), falling back to the current $project.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
#
# Returns the URL as a string. Parameters that could not be folded into
# the PATH_INFO part are appended as a ';'-separated query string.
sub href {
	my %params = @_;
	# default is to use -absolute url() i.e. $my_uri
	my $href = $params{-full} ? $my_url : $my_uri;

	# implicit -replay, must be first of implicit params
	$params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

	$params{'project'} = $project unless exists $params{'project'};

	if ($params{-replay}) {
		while (my ($name, $symbol) = each %cgi_param_mapping) {
			if (!exists $params{$name}) {
				$params{$name} = $input_params{$name};
			}
		}
	}

	my $use_pathinfo = gitweb_check_feature('pathinfo');
	if (defined $params{'project'} &&
	    (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
		# try to put as many parameters as possible in PATH_INFO:
		#   - project name
		#   - action
		#   - hash_parent or hash_parent_base:/file_parent
		#   - hash or hash_base:/filename
		#   - the snapshot_format as an appropriate suffix

		# When the script is the root DirectoryIndex for the domain,
		# $href here would be something like http://gitweb.example.com/
		# Thus, we strip any trailing / from $href, to spare us double
		# slashes in the final URL
		$href =~ s,/$,,;

		# Then add the project name, if present
		$href .= "/".esc_path_info($params{'project'});
		delete $params{'project'};

		# since we destructively absorb parameters, we keep this
		# boolean that remembers if we're handling a snapshot.
		# The action is optional, so test definedness before comparing.
		my $is_snapshot = defined $params{'action'} &&
		                  $params{'action'} eq 'snapshot';

		# Summary just uses the project path URL, any other action is
		# added to the URL
		if (defined $params{'action'}) {
			$href .= "/".esc_path_info($params{'action'})
				unless $params{'action'} eq 'summary';
			delete $params{'action'};
		}

		# Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
		# stripping nonexistent or useless pieces
		$href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
		                 || $params{'hash_parent'} || $params{'hash'});
		if (defined $params{'hash_base'}) {
			if (defined $params{'hash_parent_base'}) {
				$href .= esc_path_info($params{'hash_parent_base'});
				# skip the file_parent if it's the same as the file_name
				if (defined $params{'file_parent'}) {
					if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
						delete $params{'file_parent'};
					} elsif ($params{'file_parent'} !~ /\.\./) {
						# names containing '..' stay in the query string
						$href .= ":/".esc_path_info($params{'file_parent'});
						delete $params{'file_parent'};
					}
				}
				$href .= "..";
				delete $params{'hash_parent'};
				delete $params{'hash_parent_base'};
			} elsif (defined $params{'hash_parent'}) {
				$href .= esc_path_info($params{'hash_parent'}). "..";
				delete $params{'hash_parent'};
			}

			$href .= esc_path_info($params{'hash_base'});
			if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
				$href .= ":/".esc_path_info($params{'file_name'});
				delete $params{'file_name'};
			}
			delete $params{'hash'};
			delete $params{'hash_base'};
		} elsif (defined $params{'hash'}) {
			$href .= esc_path_info($params{'hash'});
			delete $params{'hash'};
		}

		# If the action was a snapshot, we can absorb the
		# snapshot_format parameter too
		if ($is_snapshot) {
			my $fmt = $params{'snapshot_format'};
			# snapshot_format should always be defined when href()
			# is called, but just in case some code forgets, we
			# fall back to the default
			$fmt ||= $snapshot_fmts[0];
			$href .= $known_snapshot_formats{$fmt}{'suffix'};
			delete $params{'snapshot_format'};
		}
	}

	# now encode the parameters explicitly, in @cgi_param_mapping order
	my @result = ();
	for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
		my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
		if (defined $params{$name}) {
			if (ref($params{$name}) eq "ARRAY") {
				foreach my $par (@{$params{$name}}) {
					push @result, $symbol . "=" . esc_param($par);
				}
			} else {
				push @result, $symbol . "=" . esc_param($params{$name});
			}
		}
	}
	$href .= "?" . join(';', @result) if scalar @result;

	# final transformation: trailing spaces must be escaped (URI-encoded)
	$href =~ s/(\s+)$/CGI::escape($1)/e;

	if ($params{-anchor}) {
		$href .= "#".esc_param($params{-anchor});
	}

	return $href;
}
1468
1469
1470 ## ======================================================================
1471 ## validation, quoting/unquoting and escaping
1472
# Return 1 if $input is a key of %actions, undef otherwise.
sub is_valid_action {
	my ($input) = @_;
	return exists $actions{$input} ? 1 : undef;
}
1478
# Return 1 if $input names a project that may be shown: a valid pathname
# that is a directory under $projectroot, passes check_export_ok() and,
# when $strict_export is set, appears in the projects list.
# Returns undef otherwise (nothing at all for an undefined $input).
sub is_valid_project {
	my ($input) = @_;

	return unless defined $input;

	my $path = "$projectroot/$input";
	return undef unless is_valid_pathname($input);
	return undef unless -d $path;
	return undef unless check_export_ok($path);
	return undef if $strict_export && !project_in_list($input);
	return 1;
}
1492
# Return 1 if $input is an acceptable pathname, undef otherwise.
# Rejected: undefined input; an empty, '.' or '..' path element anywhere
# (which also covers leading, trailing and doubled slashes); NUL bytes.
sub is_valid_pathname {
	my ($input) = @_;

	return undef unless defined $input;

	# no empty, '.' or '..' element at the beginning, at the end,
	# or between slashes
	return undef if $input =~ m!(^|/)(|\.|\.\.)(/|$)!;

	# no null characters
	return undef if $input =~ m!\0!;

	return 1;
}
1509
# Return 1 if $input obeys the ref name restrictions checked here
# (following git-check-ref-format), undef otherwise. Rejected: undefined
# input, a component starting with '.', '..', control characters, space,
# DEL, any of ~ ^ : ? * [ and a trailing slash.
sub is_valid_ref_format {
	my ($input) = @_;

	return undef unless defined $input;
	return undef if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;
	return 1;
}
1520
# Return 1 if $input is usable as a revision name: either a full
# 40-hex-digit object name, or a string accepted by both
# is_valid_pathname() and is_valid_ref_format(). Returns undef otherwise.
sub is_valid_refname {
	my ($input) = @_;

	return undef unless defined $input;

	# textual hashes are O.K.
	return 1 if $input =~ m/^[0-9a-fA-F]{40}$/;

	# otherwise it must be a correct pathname that also satisfies the
	# git-check-ref-format restrictions
	return undef
		unless is_valid_pathname($input) && is_valid_ref_format($input);
	return 1;
}
1535
# Decode a sequence of octets into Perl's internal string form.
# A string already flagged as UTF-8, or one that decodes cleanly as UTF-8,
# is returned as such; anything else is decoded with $fallback_encoding.
# Returns undef for undefined input. (gitweb writes its output as UTF-8
# thanks to "binmode STDOUT, ':utf8'" at the top of the script.)
sub to_utf8 {
	my ($str) = @_;
	return undef unless defined $str;

	# utf8::decode() converts in place and reports whether it succeeded
	return $str
		if utf8::is_utf8($str) || utf8::decode($str);

	return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1549
# Escape a value for use in a query string parameter.
# Unsafe characters are URI-escaped and spaces become '+'; the slash is
# kept as is even though that is not strictly correct, because quoted
# slashes look too horrible in bookmarks. Returns undef for undef input.
sub esc_param {
	my ($str) = @_;
	return undef unless defined $str;

	$str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
	$str =~ tr/ /+/;
	return $str;
}
1559
# Escape a string for use inside the PATH_INFO part of a URL.
# The rules differ slightly from query parameters: '+' is not treated as
# a space there and is kept literally, while '?' must be escaped.
# Returns undef for undef input.
sub esc_path_info {
	my ($str) = @_;
	return undef unless defined $str;

	$str =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;
	return $str;
}
1570
# Escape unsafe characters in a complete URL. Characters with a
# structural meaning in a URL (such as '/', '?', ':', '&', '=') cannot be
# quoted here; spaces become '+'. Returns undef for undef input.
sub esc_url {
	my ($str) = @_;
	return undef unless defined $str;

	$str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	$str =~ tr/ /+/;
	return $str;
}
1579
# Escape a string for use as an HTML attribute value.
# Delegates to esc_html(), since for XHTML conformance escaping
# '"' to '&quot;' alone is not enough.
sub esc_attr {
	return esc_html(@_);
}
1586
# Escape a string for output as HTML text.
# The string is converted with to_utf8() and HTML-escaped; with the
# option -nbsp => 1 spaces become &nbsp;. Control characters other than
# TAB are made visible through quot_cec(). Returns undef for undef input.
sub esc_html {
	my ($str, %opts) = @_;

	return undef unless defined $str;

	$str = $cgi->escapeHTML(to_utf8($str));
	$str =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$str =~ s|([[:cntrl:]])|(($1 eq "\t") ? $1 : quot_cec($1))|eg;
	return $str;
}
1602
# Escape a filename for output as HTML text.
# Same as esc_html(), except that every control character, TAB included,
# is made visible through quot_cec(). Returns undef for undef input.
sub esc_path {
	my ($str, %opts) = @_;

	return undef unless defined $str;

	$str = $cgi->escapeHTML(to_utf8($str));
	$str =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$str =~ s|([[:cntrl:]])|quot_cec($1)|eg;
	return $str;
}
1618
# Sanitize a string for use in XHTML served as application/xhtml+xml
# (valid XML 1.0): convert it with to_utf8() and make every control
# character except TAB, LF and CR visible through quot_cec().
# Returns undef for undef input.
sub sanitize {
	my ($str) = @_;

	return undef unless defined $str;

	$str = to_utf8($str);
	$str =~ s{([[:cntrl:]])}{
		my $chr = $1;
		index("\t\n\r", $chr) != -1 ? $chr : quot_cec($chr);
	}eg;
	return $str;
}
1629
# Make a control character "printable", using character escape codes (CEC).
#
# $cntrl is the single character to represent. Characters with a
# well-known escape are shown as such (e.g. '\n'); all others are shown as
# a backslash followed by the two-digit, zero-padded hexadecimal code.
# With -nohtml => 1 the bare escape text is returned; otherwise it is
# wrapped in <span class="cntrl">...</span>.
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# zero-pad the code: '%2x' would pad with a space and render
	# e.g. chr(1) as '\ 1'
	my $chr = ( (exists $es{$cntrl})
	            ? $es{$cntrl}
	            : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1654
# Alternative to quot_cec(): represent a control character with a numeric
# character reference to the Unicode "control picture" at 0x2400 plus the
# character's code ("printable representation", PR).
# With -nohtml => 1 the bare reference is returned; otherwise it is
# wrapped in <span class="cntrl">...</span>.
sub quot_upr {
	my ($cntrl, %opts) = @_;

	my $picture = sprintf('&#%04d;', 0x2400+ord($cntrl));
	return $opts{-nohtml}
		? $picture
		: "<span class=\"cntrl\">$picture</span>";
}
1668
# Translate the text following a backslash in a quoted filename:
# one to three octal digits give the character with that code, a known
# C escape letter gives its control character, and any other character
# stands for itself.
sub unq {
	my ($seq) = @_;
	my %es = ( # character escape codes, aka escape sequences
		't' => "\t",   # tab            (HT, TAB)
		'n' => "\n",   # newline        (NL)
		'r' => "\r",   # return         (CR)
		'f' => "\f",   # form feed      (FF)
		'b' => "\b",   # backspace      (BS)
		'a' => "\a",   # alarm (bell)   (BEL)
		'e' => "\e",   # escape         (ESC)
		'v' => "\013", # vertical tab   (VT)
	);

	# octal char sequence
	return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;
	# C escape sequence, aka character escape code
	return $es{$seq} if exists $es{$seq};
	# quoted ordinary character
	return $seq;
}

# git may return quoted and escaped filenames: when $str is wrapped in
# double quotes, strip them and expand the backslash escapes inside;
# any other string is returned unchanged.
sub unquote {
	my ($str) = @_;

	return $str unless $str =~ m/^"(.*)"$/;

	my $inner = $1;
	$inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	return $inner;
}
1704
# Expand tabs: replace each TAB with the number of spaces needed to reach
# the next multiple-of-8 column, and return the resulting line.
sub untabify {
	my ($line) = @_;

	my $pos;
	while (($pos = index($line, "\t")) != -1) {
		# 1..8 spaces, depending on where the tab sits
		substr($line, $pos, 1, ' ' x (8 - ($pos % 8)));
	}

	return $line;
}
1718
# Count the entries of git_get_projects_list() whose 'path' equals
# $project; the result is false (0) when the list is empty or has no
# such entry.
sub project_in_list {
	my ($project) = @_;
	my @list = git_get_projects_list();
	return 0 unless @list;
	return scalar(grep { $_->{'path'} eq $project } @list);
}
1724
1725 ## ----------------------------------------------------------------------
1726 ## HTML aware string manipulation
1727
# Shorten a string to about $len characters, preferring a word boundary.
#
# Arguments: $str, $len, $add_len (default 10), $where (default 'right';
# one of 'left' | 'center' | 'right', naming the kept-relative side where
# the ellipsis goes).
#
# The cut is made on a word boundary between position $len and
# $len+$add_len; if there is none, at $len+$add_len. The string is
# returned unchopped when the chopped part plus the ellipsis marking it
# would not be shorter than the original.
sub chop_str {
	my ($str, $len, $add_len, $where) = @_;
	$add_len ||= 10;
	$where   ||= 'right';

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# return early if chopping wouldn't make the string shorter;
	# the filler is 5 characters long in the middle, 4 at either end
	my $in_center = ($where eq 'center');
	return $str if ($len + ($in_center ? 5 : 4) >= length($str));

	# when chopping in the middle, distribute $len into left and right part
	$len = int($len/2) if $in_center;

	# regexps: ending and beginning with word part up to $add_len
	my $endre = qr/.{$len}\w{0,$add_len}/;
	my $begre = qr/\w{0,$add_len}.{$len}/;

	if ($where eq 'left') {
		$str =~ m/^(.*?)($begre)$/;
		my ($lead, $body) = ($1, $2);
		$lead = " ..." if length($lead) > 4;
		return "$lead$body";
	}

	if ($in_center) {
		$str =~ m/^($endre)(.*)$/;
		my ($left, $rest) = ($1, $2);
		$rest =~ m/^(.*?)($begre)$/;
		my ($mid, $right) = ($1, $2);
		$mid = " ... " if length($mid) > 5;
		return "$left$mid$right";
	}

	# default: chop on the right
	$str =~ m/^($endre)(.*)$/;
	my ($body, $tail) = ($1, $2);
	$tail = "... " if length($tail) > 4;
	return "$body$tail";
}
1787
# Same arguments as chop_str(); the result is HTML-escaped, and when the
# string actually got chopped it is wrapped in a <span> whose title
# attribute carries the full text (control characters shown as '?').
sub chop_and_escape_str {
	my ($str) = @_;

	my $chopped = chop_str(@_);
	$str = to_utf8($str);

	# nothing was cut off: no tooltip needed
	return esc_html($chopped) if $chopped eq $str;

	$str =~ s/[[:cntrl:]]/?/g;
	return $cgi->span({-title=>$str}, esc_html($chopped));
}
1803
# HTML-escape $str while wrapping selected fragments in
# <span class="$css_class">. Regions are given as [begin, end) pairs
# (array references) and are assumed not to overlap; any non-array
# arguments after $css_class are passed to esc_html() as options.
#
# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
# '<span class="mark">foo</span>bar'
sub esc_html_hl_regions {
	my ($str, $css_class, @args) = @_;

	# separate region pairs from esc_html options
	my (@regions, @opt_list);
	foreach my $arg (@args) {
		if (ref($arg) eq 'ARRAY') {
			push @regions, $arg;
		} else {
			push @opt_list, $arg;
		}
	}
	my %opts = @opt_list;
	return esc_html($str, %opts) unless @regions;

	my $out = '';
	my $pos = 0;	# end of the part of $str already emitted

	foreach my $region (@regions) {
		my ($begin, $end) = @$region;

		# Don't create empty <span> elements.
		next if $end <= $begin;

		my $marked = esc_html(substr($str, $begin, $end - $begin),
		                      %opts);

		# plain text between the previous region and this one
		if ($begin > $pos) {
			$out .= esc_html(substr($str, $pos, $begin - $pos), %opts);
		}
		$out .= $cgi->span({-class => $css_class}, $marked);

		$pos = $end;
	}

	# whatever follows the last region
	if ($pos < length($str)) {
		$out .= esc_html(substr($str, $pos), %opts);
	}

	return $out;
}
1839
# Return a list of [begin, end] offset pairs, one per match of $regexp in
# $str. Returns nothing when either argument is undefined.
sub matchpos_list {
	my ($str, $regexp) = @_;
	return if !defined $str || !defined $regexp;

	my @spans;
	# @- and @+ hold the offsets of the start and end of the last match
	push @spans, [ $-[0], $+[0] ]
		while $str =~ /$regexp/g;
	return @spans;
}
1851
# HTML-escape $str, marking every match of $regexp with the 'match' CSS
# class; with an undefined $regexp or no matches it is plain esc_html().
sub esc_html_match_hl {
	my ($str, $regexp) = @_;

	my @matches = defined $regexp ? matchpos_list($str, $regexp) : ();
	return @matches
		? esc_html_hl_regions($str, 'match', @matches)
		: esc_html($str);
}
1862
1863
# HTML-escape the shortened string $chopped, marking the matches of
# $regexp found in the full string $str. A match that lies in (or runs
# into) the part that was chopped off is shown by marking the trailing
# ellipsis. Falls back to esc_html_match_hl() when $chopped is undefined.
sub esc_html_match_hl_chopped {
	my ($str, $chopped, $regexp) = @_;
	return esc_html_match_hl($str, $regexp) unless defined $chopped;

	my @matches = matchpos_list($str, $regexp);
	return esc_html($chopped) unless @matches;

	# split off the ellipsis appended by chop_str, if there is one
	my $tail = "... "; # see chop_str
	my $had_tail = ($chopped =~ s/\Q$tail\E$//);
	$tail = '' unless $had_tail;

	my $chop_len = length($chopped);
	my $tail_len = length($tail);
	my @filtered;

	# keep matches inside the visible text; the first one reaching past
	# it is mapped onto the ellipsis and ends the scan
	foreach my $m (@matches) {
		my ($begin, $end) = @$m;
		if ($begin > $chop_len) {
			push @filtered, [ $chop_len, $chop_len + $tail_len ] if ($tail_len > 0);
			last;
		}
		if ($end > $chop_len) {
			push @filtered, [ $begin, $chop_len + $tail_len ];
			last;
		}
		push @filtered, $m;
	}

	return esc_html_hl_regions($chopped . $tail, 'match', @filtered);
}
1894
1895 ## ----------------------------------------------------------------------
1896 ## functions returning short strings
1897
# Map an age in seconds to a CSS class name:
# "noage" for an undefined age, "age0" below two hours,
# "age1" below two days, "age2" for anything older.
sub age_class {
	my ($age) = @_;

	return "noage" unless defined $age;
	return "age0"  if ($age < 60*60*2);
	return "age1"  if ($age < 60*60*24*2);
	return "age2";
}
1912
# Turn an age in seconds into a human readable "nn units ago" string.
# The largest unit of which the age exceeds two whole units is used
# (years, months, weeks, days, hours, min, sec); an age of two seconds
# or less yields " right now" (with the leading space).
sub age_string {
	my ($age) = @_;

	# [ lower limit (exclusive), successive divisors, suffix ]
	# The divisors are applied one after another, largest unit first.
	my @scale = (
		[ 60*60*24*365*2,      [ 60, 60, 24, 365 ],    " years ago"  ],
		[ 60*60*24*(365/12)*2, [ 60, 60, 24, 365/12 ], " months ago" ],
		[ 60*60*24*7*2,        [ 60, 60, 24, 7 ],      " weeks ago"  ],
		[ 60*60*24*2,          [ 60, 60, 24 ],         " days ago"   ],
		[ 60*60*2,             [ 60, 60 ],             " hours ago"  ],
		[ 60*2,                [ 60 ],                 " min ago"    ],
		[ 2,                   [],                     " sec ago"    ],
	);

	foreach my $step (@scale) {
		my ($limit, $divisors, $suffix) = @$step;
		next unless ($age > $limit);

		my $count = $age;
		$count /= $_ foreach @$divisors;
		return int($count) . $suffix;
	}

	return " right now";
}
1944
# File type bit patterns used in addition to the ones imported from Fcntl.
# S_IFGITLINK is the type tested by S_ISGITLINK(); S_IFINVALID is not
# referenced in this part of the file.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1949
# True when the (numeric) file mode denotes a gitlink, i.e. a
# submodule/subproject entry referencing a commit object.
sub S_ISGITLINK {
	my ($mode) = @_;

	# isolate the file type bits before comparing
	my $type_bits = $mode & S_IFMT;
	return $type_bits == S_IFGITLINK;
}
1956
# Convert a file mode given as an octal string into an "ls -l" style
# symbolic mode string.  Submodules are shown as 'm---------'; unknown
# file types as '----------'.
sub mode_str {
	my ($octal) = @_;
	my $mode = oct $octal;

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
	return 'lrwxrwxrwx' if S_ISLNK($mode);
	return '----------' unless S_ISREG($mode);

	# regular file: git cares only about the executable bit
	return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1978
# Convert a file mode given as an octal string into a short file type
# name: "submodule", "directory", "symlink", "file" or "unknown".
# An argument that is not a string of octal digits is returned unchanged.
sub file_type {
	my ($mode) = @_;

	return $mode unless ($mode =~ m/^[0-7]+$/);
	my $bits = oct $mode;

	return "submodule" if S_ISGITLINK($bits);
	return "directory" if S_ISDIR($bits & S_IFMT);
	return "symlink"   if S_ISLNK($bits);
	return "file"      if S_ISREG($bits);
	return "unknown";
}
2001
# Convert a file mode given as an octal string into a file type
# description.  Same as file_type(), except that a regular file with the
# owner-executable bit set is described as "executable".
# An argument that is not a string of octal digits is returned unchanged.
sub file_type_long {
	my ($mode) = @_;

	return $mode unless ($mode =~ m/^[0-7]+$/);
	my $bits = oct $mode;

	return "submodule" if S_ISGITLINK($bits);
	return "directory" if S_ISDIR($bits & S_IFMT);
	return "symlink"   if S_ISLNK($bits);
	return "unknown"   unless S_ISREG($bits);

	return ($bits & S_IXUSR) ? "executable" : "file";
}
2028
2029
2030 ## ----------------------------------------------------------------------
2031 ## functions returning short HTML fragments, or transforming HTML fragments
2032 ## which don't belong to other sections
2033
# Format one line of a commit message: escape it for HTML (keeping
# spacing via -nbsp) and turn every stand-alone run of 8 to 40 hex digits
# into a link to the "object" view of that id.
sub format_log_line_html {
	my ($text) = @_;

	# build the link for a single object id
	my $link_object = sub {
		my ($id) = @_;
		return $cgi->a({-href => href(action=>"object", hash=>$id),
		                -class => "text"}, $id);
	};

	my $html = esc_html($text, -nbsp=>1);
	$html =~ s{\b([0-9a-fA-F]{8,40})\b}{ $link_object->($1) }eg;

	return $html;
}
2046
# format marker of refs pointing to given object
#
# $refs maps an object id to an array reference of ref names (e.g.
# "tags/v2.6.11" or "heads/next"; a trailing "^{}" marks an indirect,
# i.e. annotated tag, entry).  $id is the object id to look up.
# Returns ' <span class="refs">...</span>' containing one linked <span>
# per ref, or the empty string if no ref is recorded for $id.
# The data in $refs is left unmodified.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
	my ($refs, $id) = @_;
	my $markers = '';

	if (defined $refs->{$id}) {
		foreach my $entry (@{$refs->{$id}}) {
			# Work on a copy: the loop variable aliases the element stored
			# in $refs, and stripping "^{}" in place would make a later
			# call for the same id treat the annotated tag as lightweight.
			my $ref = $entry;

			# this code exploits the fact that non-lightweight tags are the
			# only indirect objects, and that they are the only objects for which
			# we want to use tag instead of shortlog as action
			my ($type, $name) = qw();
			my $indirect = ($ref =~ s/\^\{\}$//);
			# e.g. tags/v2.6.11 or heads/next
			if ($ref =~ m!^(.*?)s?/(.*)$!) {
				$type = $1;
				$name = $2;
			} else {
				$type = "ref";
				$name = $ref;
			}

			my $class = $type;
			$class .= " indirect" if $indirect;

			my $dest_action = "shortlog";

			if ($indirect) {
				$dest_action = "tag" unless $action eq "tag";
			} elsif ($action =~ /^(history|(short)?log)$/) {
				$dest_action = $action;
			}

			# link target is always the fully qualified ref name
			my $dest = "";
			$dest .= "refs/" unless $ref =~ m!^refs/!;
			$dest .= $ref;

			my $link = $cgi->a({
				-href => href(
					action=>$dest_action,
					hash=>$dest
				)}, $name);

			$markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
				$link . "</span>";
		}
	}

	if ($markers) {
		return ' <span class="refs">'. $markers . '</span>';
	} else {
		return "";
	}
}
2106
# Format a title line as a link to $href.
# When $short is shorter than $long, the short form is the link text and
# the long form (control characters replaced by '?') becomes the tooltip;
# otherwise the long form is the link text.  $extra (optional, e.g. ref
# markers) is appended after the link.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my @attrs = (-href => $href, -class => "list subject");
	my $label = $long;

	if (length($short) < length($long)) {
		$long =~ s/[[:cntrl:]]/?/g;
		push @attrs, -title => to_utf8($long);
		$label = $short;
	}

	return $cgi->a(+{ @attrs }, esc_html($label)) . $extra;
}
2122
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is keyed by the lowercased email and is shared by all avatar
# engines (picon_url() and gravatar_url() below), which are free to use it
# as preferred: picon stores the complete URL, gravatar only the part before
# the size. Since only one avatar engine is used for any given page, there's
# no risk for cache conflicts.
our %avatar_cache = ();
2130
# Return the picon URL for the given email, built for the picon search
# service at http://www.cs.indiana.edu/picons/search.html
# The email is lowercased and split at '@' into user and domain; the
# resulting URL is remembered in %avatar_cache.
sub picon_url {
	my ($address) = @_;
	my $email = lc $address;

	return $avatar_cache{$email} if $avatar_cache{$email};

	my ($user, $domain) = split('@', $email);
	my $url =
		"//www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
		"$domain/$user/" .
		"users+domains+unknown/up/single";

	$avatar_cache{$email} = $url;
	return $avatar_cache{$email};
}
2144
# Return the gravatar URL for the given email at the given size.
# Only the part of the URL before the size (which contains the MD5 digest
# of the lowercased email) is kept in %avatar_cache, so one cache entry
# serves every requested size.
sub gravatar_url {
	my ($address, $size) = @_;
	my $email = lc $address;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"//www.gravatar.com/avatar/" .
			Digest::MD5::md5_hex($email) . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
2157
# Return an <img> element with the avatar for $email, or the empty string
# if the configured avatar provider ($git_avatar) yields no URL.
# Options:
#   -size       => key into %avatar_size (falls back to 'default')
#   -pad_before => if true, put "&nbsp;" in front of the image
#   -pad_after  => if true, put "&nbsp;" after the image
sub git_get_avatar {
	my ($email, %opts) = @_;

	my $size_name = $opts{-size} || 'default';
	my $size = $avatar_size{$size_name} || $avatar_size{'default'};

	# Other providers can be added by extending this chain. If no variant
	# yields a URL, we assume avatars are completely disabled/unavailable.
	my $url = $git_avatar eq 'gravatar' ? gravatar_url($email, $size)
	        : $git_avatar eq 'picon'    ? picon_url($email)
	        :                             "";
	return "" unless $url;

	my $pad_before = $opts{-pad_before} ? "&nbsp;" : "";
	my $pad_after  = $opts{-pad_after}  ? "&nbsp;" : "";

	return $pad_before .
	       "<img width=\"$size\" " .
	       "class=\"avatar\" " .
	       "src=\"".esc_url($url)."\" " .
	       "alt=\"\" " .
	       "/>" . $pad_after;
}
2186
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype is the search type to link to ('author' or 'committer');
# it also selects the verb used in the link title.  When the 'search'
# feature is disabled, $displaytext is returned unchanged.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;

	# nothing to link to without the search feature
	return $displaytext unless gitweb_check_feature('search');

	my %verb_for = (author => "authored", committer => "committed");
	my $performed = exists $verb_for{$searchtype} ? $verb_for{$searchtype} : "";

	return $cgi->a({-href => href(action=>"search", hash=>$hash,
	                              searchtext=>$author,
	                              searchtype=>$searchtype), class=>"list",
	                title=>"Search for commits $performed by $author"},
	               $displaytext);
}
2209
# Format the author of commit $co inside an element named $tag with
# class "author".  The content is the author's avatar followed by the
# author name, together linked to an author search.  Any further
# arguments are passed on to chop_and_escape_str() to shorten the name.
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $name_html = chop_and_escape_str($co->{'author_name'}, @chop_args);
	my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
	my $link = format_search_author($co->{'author_name'}, "author",
	                                $avatar . $name_html);

	return "<$tag class=\"author\">" . $link . "</$tag>";
}
2223
# Format the git diff header line, i.e. "diff --(git|combined|cc) ...".
# The file names in $line are replaced by escaped names from $from / $to,
# each linked when the corresponding 'href' is set (it is unset for an
# added or deleted file).  A combined diff ($diffinfo->{'nparents'} set)
# shows only the resulting file; an ordinary diff shows "a/..." and "b/...".
# Returns the line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# escaped (and, where possible, linked) path of one side of the diff
	my $path_html = sub {
		my ($side, $prefix) = @_;
		my $text = $prefix . esc_path($side->{'file'});
		return $text unless $side->{'href'};
		return $cgi->a({-href => $side->{'href'}, -class => "path"}, $text);
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $path_html->($to, '');
	} else {
		# "ordinary" diff
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $path_html->($from, 'a/');
		$line .= ' ';
		$line .= $path_html->($to, 'b/');
	}

	return "<div class=\"diff header\">$line</div>\n";
}
2259
# format extended diff header line, before patch itself
#
# $line is one extended header line; $diffinfo describes the diff
# ('nparents', 'from_id', 'to_id'); $from and $to carry 'file' and 'href'
# for each side (for a combined diff $from->{'href'} and
# $diffinfo->{'from_id'} are array references, one entry per parent).
# The following parts of the line are decorated:
#  - the path in "copy/rename from/to" lines is replaced by a link,
#  - a trailing six-digit mode gets its file type description appended,
#  - the hashes in "index" lines are replaced by links on abbreviated ids
#    (seven zeros where a side has no link).
# Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
	my $line = shift;
	my $diffinfo = shift;
	my ($from, $to) = @_;

	# match <path>
	if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
		$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
		                 esc_path($from->{'file'}));
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
		$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
		                 esc_path($to->{'file'}));
	}
	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
		         file_type_long($1) .
		         ')</span>';
	}
	# match <hash>
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff
		$line = 'index ';
		for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
			if ($from->{'href'}[$i]) {
				$line .= $cgi->a({-href=>$from->{'href'}[$i],
				                  -class=>"hash"},
				                 substr($diffinfo->{'from_id'}[$i],0,7));
			} else {
				$line .= '0' x 7;
			}
			# separator
			$line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
		}
		$line .= '..';
		if ($to->{'href'}) {
			$line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                 substr($diffinfo->{'to_id'},0,7));
		} else {
			$line .= '0' x 7;
		}

	} elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff
		# (the dots are escaped: the separator is a literal "..",
		# not any two characters)
		my ($from_link, $to_link);
		if ($from->{'href'}) {
			$from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
			                     substr($diffinfo->{'from_id'},0,7));
		} else {
			$from_link = '0' x 7;
		}
		if ($to->{'href'}) {
			$to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                   substr($diffinfo->{'to_id'},0,7));
		} else {
			$to_link = '0' x 7;
		}
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
		$line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2325
# Format the from-file/to-file diff header ("--- ..." and "+++ ..." lines).
# For an ordinary diff one "from" line is produced; for a combined diff
# ($diffinfo->{'nparents'} set) there is one "from" line per parent, each
# with a numbered link to the blobdiff against that parent (@parents holds
# the parent commit ids).  Lines naming /dev/null get no extra formatting.
# Returns the lines wrapped in <div class="diff from_file"> and
# <div class="diff to_file"> elements.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my $result = '';
	my $line;

	#assert($from_line =~ m/^---/) if DEBUG;
	if ($diffinfo->{'nparents'}) {
		# combined diff (merge commit)
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			if ($from->{'href'}[$i]) {
				my $diff_link =
					$cgi->a({-href=>href(action=>"blobdiff",
					                     hash_parent=>$diffinfo->{'from_id'}[$i],
					                     hash_parent_base=>$parents[$i],
					                     file_parent=>$from->{'file'}[$i],
					                     hash=>$diffinfo->{'to_id'},
					                     hash_base=>$hash,
					                     file_name=>$to->{'file'}),
					         -class=>"path",
					         -title=>"diff" . ($i+1)},
					        $i+1);
				my $file_link =
					$cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
					        esc_path($from->{'file'}[$i]));
				$line = '--- ' . $diff_link . '/' . $file_link;
			} else {
				$line = '--- /dev/null';
			}
			$result .= qq!<div class="diff from_file">$line</div>\n!;
		}
	} else {
		# ordinary (single parent) diff
		$line = $from_line;
		# no extra formatting for "^--- /dev/null"
		if ($line =~ m!^--- "?a/!) {
			$line = '--- a/';
			if ($from->{'href'}) {
				$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
				                 esc_path($from->{'file'}));
			} else {
				$line .= esc_path($from->{'file'});
			}
		}
		$result .= qq!<div class="diff from_file">$line</div>\n!;
	}

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	$line = $to_line;
	# no extra formatting for "^+++ /dev/null"
	if ($line =~ m!^\+\+\+ "?b/!) {
		$line = '+++ b/';
		if ($to->{'href'}) {
			$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
			                 esc_path($to->{'file'}));
		} else {
			$line .= esc_path($to->{'file'});
		}
	}
	$result .= qq!<div class="diff to_file">$line</div>\n!;

	return $result;
}
2391
# Create the note shown for a patch that combined diff simplified away:
# a "diff --cc <file>" header (the file name linked to its blob view
# unless the file was deleted) followed by a "Simple merge" notice.
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $file_html;
	if (is_deleted($diffinfo)) {
		$file_html = esc_path($diffinfo->{'to_file'});
	} else {
		$file_html = $cgi->a({-href => href(action=>"blob",
		                                    hash_base=>$hash,
		                                    hash=>$diffinfo->{'to_id'},
		                                    file_name=>$diffinfo->{'to_file'}),
		                      -class => "path"},
		                     esc_path($diffinfo->{'to_file'}));
	}

	return "<div class=\"diff header\">" .
	       "diff --cc " .
	       $file_html .
	       "</div>\n" . # class="diff header"
	       "<div class=\"diff nodifferences\">" .
	       "Simple merge" .
	       "</div>\n"; # class="diff nodifferences"
}
2416
# Classify a line of patch body, returning one of the class names
# "chunk_header", "incomplete", "ctx", "add", "rem", or "" if nothing
# matches.  For a combined diff (recognised by $from->{'href'} being an
# array reference, with both $from and $to given) the number of leading
# sign columns equals the number of entries in that array; otherwise a
# single sign column is assumed.
sub diff_line_class {
	my ($line, $from, $to) = @_;

	my $is_combined = ($from && $to && ref($from->{'href'}) eq "ARRAY");
	my $num_sign = $is_combined ? scalar @{$from->{'href'}} : 1;

	# First matching rule wins.  The rule for context must come before
	# the rules for add/rem, or we would have to use more complicated
	# regexp, for example
	# qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
	my @rules = (
		[ qr/^\@\@{$num_sign} /, "chunk_header" ],
		[ qr/^\\/,               "incomplete"   ],
		[ qr/^ {$num_sign}/,     "ctx"          ],
		[ qr/^[+ ]{$num_sign}/,  "add"          ],
		[ qr/^[- ]{$num_sign}/,  "rem"          ],
	);

	foreach my $rule (@rules) {
		my ($regexp, $class) = @$rule;
		return $class if ($line =~ $regexp);
	}

	# fallback
	return "";
}
2445
# Format the chunk header line of a unified diff ("@@ -a,b +c,d @@ ...").
# Assumes that $from and $to are defined and correctly filled, and that
# $line holds such a chunk header.  The "-a,b" and "+c,d" ranges are
# linked to the starting line ("#l<n>") of the respective file when its
# 'href' is set; the text after the closing "@@" is escaped and put into
# a separate <span class="section">.
sub format_unidiff_chunk_header {
	my ($line, $from, $to) = @_;

	# the line counts (3rd and 6th group) are matched but not needed
	my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
		$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

	my $from_html = $from_text;
	if ($from->{'href'}) {
		$from_html = $cgi->a({-href=>"$from->{'href'}#l$from_start",
		                      -class=>"list"}, $from_text);
	}

	my $to_html = $to_text;
	if ($to->{'href'}) {
		$to_html = $cgi->a({-href=>"$to->{'href'}#l$to_start",
		                    -class=>"list"}, $to_text);
	}

	return "<span class=\"chunk_info\">@@ $from_html $to_html @@</span>" .
	       "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2469
# Format the chunk header line of a combined diff
# ("@@@ -a,b -c,d +e,f @@@ ...").
# Assumes that $from and $to are defined and correctly filled, and that
# $line holds such a chunk header.  The last range belongs to the result
# ($to), all preceding ones to the parents ($from->{'href'} is indexed by
# parent).  Each range is linked to the starting line ("#l<n>") of its
# file when the corresponding href is set; the text after the closing
# "@" run is escaped and put into a separate <span class="section">.
sub format_cc_diff_chunk_header {
	my ($line, $from, $to) = @_;

	my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

	# ranges look like "-12,3" or "+7"; the start is what follows the sign,
	# up to the optional comma
	my @range_text = split(' ', $ranges);
	my @range_start = map {
		my ($start) = (split(',', substr($_, 1)), 0);
		$start;
	} @range_text;

	# the last range describes the resulting file
	my $to_text  = pop @range_text;
	my $to_start = pop @range_start;

	my @parts = ($prefix);
	foreach my $i (0 .. $#range_text) {
		if ($from->{'href'}[$i]) {
			push @parts, $cgi->a({-href=>"$from->{'href'}[$i]#l$range_start[$i]",
			                      -class=>"list"}, $range_text[$i]);
		} else {
			push @parts, $range_text[$i];
		}
	}
	if ($to->{'href'}) {
		push @parts, $cgi->a({-href=>"$to->{'href'}#l$to_start",
		                      -class=>"list"}, $to_text);
	} else {
		push @parts, $to_text;
	}
	push @parts, $prefix;

	return "<span class=\"chunk_info\">" . join(' ', @parts) . "</span>" .
	       "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2508
# Process a patch (diff) line (not to be used for diff headers) and return
# it as a <div> whose class is "diff" plus $diff_class (if given).
# A line passed as a reference is treated as ready-made HTML and is not
# esc_html()'ed.  A plain line is chomped and untabified; chunk headers
# are formatted specially when both $from and $to are given, anything
# else is HTML-escaped.
sub format_diff_line {
	my ($line, $diff_class, $from, $to) = @_;

	my $html;
	if (ref($line)) {
		$html = $$line;
	} else {
		chomp $line;
		my $text = untabify($line);

		if ($from && $to && $text =~ m/^\@{2} /) {
			$html = format_unidiff_chunk_header($text, $from, $to);
		} elsif ($from && $to && $text =~ m/^\@{3}/) {
			$html = format_cc_diff_chunk_header($text, $from, $to);
		} else {
			$html = esc_html($text, -nbsp=>1);
		}
	}

	my $classes = $diff_class ? "diff $diff_class" : "diff";

	return "<div class=\"$classes\">$html</div>\n";
}
2537
# Generate the snapshot link(s) for the tree/commit with the given hash,
# depending on how many formats are listed in @snapshot_fmts:
#  - none:    returns undef
#  - one:     a single "_snapshot_" link whose tooltip names the format
#  - several: "snapshot (_tar.gz_ _zip_)", one link per format name
sub format_snapshot_links {
	my ($hash) = @_;

	return undef unless @snapshot_fmts;

	if (@snapshot_fmts == 1) {
		# A single "snapshot" link whose tooltip bears the format name.
		my ($fmt) = @snapshot_fmts;
		return
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				),
				-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
				}, "snapshot");
	}

	# A parenthesized list of links bearing format names.
	my @links = map {
		$cgi->a({
			-href => href(
				action=>"snapshot",
				hash=>$hash,
				snapshot_format=>$_
			)
			}, $known_snapshot_formats{$_}{'display'})
	} @snapshot_fmts;

	return "snapshot (" . join(' ', @links) . ")";
}
2572
2573 ## ......................................................................
2574 ## functions returning values to be passed, perhaps after some
2575 ## transformation, to other functions; e.g. returning arguments to href()
2576
# Return a hash to be passed to href() to generate the URL of a feed in
# the given format (default 'Atom'); the -title key holds a description
# of the link.  Returns nothing when no project is selected, or when the
# current action has no specific feed.
sub get_feed_info {
	my ($format) = @_;
	$format ||= 'Atom';
	my %res = (action => lc($format));

	# feed links are possible only for project views
	return unless (defined $project);
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branches refs uses 'refs/' + $get_branch_refs()[x] + '/' prefix
	# (fullname) to differentiate from tag links; this also makes
	# possible to detect branch links
	my $branch = undef;
	my $matched_ref = 0;
	REF:
	foreach my $ref (get_branch_refs()) {
		foreach my $candidate ($hash_base, $hash) {
			next unless defined $candidate;
			if ($candidate =~ m!^refs/\Q$ref\E/(.*)$!) {
				$branch = $1;
				$matched_ref = $ref;
				last REF;
			}
		}
	}

	# find log type for feed description (title)
	my $type;
	if (defined $file_name) {
		$type  = "history of $file_name";
		$type .= "/" if ($action eq 'tree');
		$type .= " on '$branch'" if (defined $branch);
	} else {
		$type = defined $branch ? "log of $branch" : 'log';
	}

	$res{-title} = $type;
	$res{'hash'} = (defined $branch ? "refs/$matched_ref/$branch" : undef);
	$res{'file_name'} = $file_name;

	return %res;
}
2618
2619 ## ----------------------------------------------------------------------
2620 ## git utility subroutines, invoking git commands
2621
# Return, as a list, the path to the core git executable followed by the
# --git-dir parameter for the current $git_dir.  Every call is counted in
# $number_of_git_cmds.
sub git_cmd {
	$number_of_git_cmds++;
	return ($GIT, "--git-dir=$git_dir");
}
2627
# Quote the given arguments for passing them to the shell: each argument
# is wrapped in single quotes, with embedded ' and ! characters escaped,
# and the results are joined with spaces.
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
	my @quoted;
	foreach my $word (@_) {
		# copy first, so that the caller's argument is left untouched
		(my $escaped = $word) =~ s/(['!])/'\\$1'/g;
		push @quoted, "'$escaped'";
	}
	return join(' ', @quoted);
}
2636
# Return the full hash that HEAD of the given project resolves to
# (see git_get_hash()).
sub git_get_head_hash {
	my ($project) = @_;
	return git_get_full_hash($project, 'HEAD');
}
2641
# Resolve a revision of a project to its hash; all arguments are handed
# to git_get_hash() unchanged.
sub git_get_full_hash {
	my @args = @_;
	return git_get_hash(@args);
}
2645
# Resolve a revision of a project to its abbreviated hash: calls
# git_get_hash() with '--short=7' appended to the given arguments.
sub git_get_short_hash {
	my @args = (@_, '--short=7');
	return git_get_hash(@args);
}
2649
# Resolve $hash in the given project by running
# "git rev-parse --verify -q [options] <hash>" and return the first line
# of its output (chomped), or undef if the command could not be started
# or printed nothing.
# $git_dir is temporarily pointed at the project; it is restored
# afterwards only if it was defined on entry.
sub git_get_hash {
	my ($project, $hash, @options) = @_;

	my $saved_git_dir = $git_dir;
	$git_dir = "$projectroot/$project";

	my $retval = undef;
	my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
	if (open my $fd, '-|', @cmd) {
		$retval = <$fd>;
		chomp $retval if defined $retval;
		close $fd;
	}

	$git_dir = $saved_git_dir if defined $saved_git_dir;

	return $retval;
}
2666
# Return the type of the given object as printed by "git cat-file -t".
# Returns nothing if the command cannot be started or closing the pipe
# reports failure.
sub git_get_type {
	my ($hash) = @_;

	my $fd;
	unless (open $fd, "-|", git_cmd(), "cat-file", '-t', $hash) {
		return;
	}
	my $type = <$fd>;
	return unless close $fd;

	chomp $type;
	return $type;
}
2677
# repository configuration
# $config_file names the config file ("$git_dir/config") whose settings are
# currently held in %config; git_get_project_config() compares it against
# the current $git_dir to decide whether %config has to be re-read.
our $config_file = '';
# parsed configuration of the current repository, as returned by
# git_parse_project_config('gitweb')
our %config;
2681
# Add $value under $key in the hash referenced by $hash, supporting
# multiple values per key: a first value is stored directly (not as
# [ <value> ]); a second value turns the entry into an anonymous array of
# both; further values are appended to that array.
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (exists $hash->{$key} && ref $hash->{$key}) {
		# already multi-valued
		push @{$hash->{$key}}, $value;
	} elsif (exists $hash->{$key}) {
		# second value: promote the scalar to a list
		$hash->{$key} = [ $hash->{$key}, $value ];
	} else {
		$hash->{$key} = $value;
	}
}
2695
# Return a hash with the configuration of the current git project, as
# printed by "git config -z -l".  Keys are full variable names; a
# variable occurring several times gets an array reference of its values
# (see hash_set_multi()), a variable without a value gets undef.
# The optional argument limits the result to variables of one section;
# it is used as a regexp matching the section name, e.g. 'gitweb'.
# Returns nothing if git cannot be run.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# "git config -z" terminates each entry with NUL
	local $/ = "\0";

	# Compile the section filter once per call.  (No /o modifier here:
	# that would keep using the pattern from the very first call for the
	# life of the process, whatever section later calls ask for.)
	my $section_filter;
	$section_filter = qr/^(?:$section_regexp)\./
		if defined $section_regexp;

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		# key and value are separated by the first newline
		my ($key, $value) = split(/\n/, $keyval, 2);

		hash_set_multi(\%config, $key, $value)
			if (!defined $section_filter || $key =~ $section_filter);
	}
	close $fh;

	return %config;
}
2718
# Interpret a config value as boolean.
# True are: no value at all (undef, i.e. just "section.key"), a string of
# digits that is true as a Perl value, and 'true' or 'yes' in any case.
# Everything else is false (never an error).  Surrounding whitespace is
# ignored.
sub config_to_bool {
	my ($val) = @_;

	return 1 unless defined $val; # section.key

	# strip leading and trailing whitespace
	for ($val) {
		s/^\s+//;
		s/\s+$//;
	}

	return $val if ($val =~ /^\d+$/ && $val); # section.key = 1
	return ($val =~ /^(?:true|yes)$/i);        # section.key = true
}
2734
# Convert a config value to a simple decimal number.
# An optional suffix of 'k', 'm' or 'g' (in any case) multiplies the
# number by 1024, 1048576 or 1073741824.  Surrounding whitespace is
# ignored; a value not of the form <digits><suffix> is returned as is.
sub config_to_int {
	my ($val) = @_;

	# strip leading and trailing whitespace
	for ($val) {
		s/^\s+//;
		s/\s+$//;
	}

	my %factor_for = (
		k => 1024,
		m => 1048576,
		g => 1073741824,
	);

	if ($val =~ /^([0-9]*)([kmg])$/i) {
		my ($num, $unit) = ($1, lc($2));
		return $num * $factor_for{$unit};
	}
	return $val;
}
2754
# Normalize a config value to an array reference: a reference is returned
# as it is, a defined scalar is wrapped into a one-element array, and
# undef yields an empty array.
sub config_to_multi {
	my ($val) = @_;

	return $val if ref($val);
	return [ $val ] if defined($val);
	return [];
}
2761
# Look up the variable gitweb.$key in the configuration of the current
# repository ($git_dir).  The configuration is read via
# git_parse_project_config('gitweb') and kept in %config until $git_dir
# changes.
# $type may be 'bool' or 'int' (optionally written with a leading "--");
# any other type is ignored.  With 'bool' the result is the string 'true'
# or 'false', with 'int' the value converted by config_to_int(), otherwise
# the stored value itself.
# Returns nothing if there is no current repository, the key is empty or
# contains characters that are not allowed, or the variable is not set.
sub git_get_project_config {
	my ($key, $type) = @_;

	return unless defined $git_dir;

	# key sanity check
	return unless ($key);
	# only subsection, if exists, is case sensitive,
	# and not lowercased by 'git config -z -l'
	if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
		my ($section, $subsection, $variable) = ($1, $2, $3);
		$variable =~ s/_//g;
		return if ($variable =~ /\W/ || $section =~ /\W/);
		$key = join(".", lc($section), $subsection, lc($variable));
	} else {
		$key = lc($key);
		$key =~ s/_//g;
		return if ($key =~ /\W/);
	}
	$key =~ s/^gitweb\.//;

	# type sanity check
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			if ($type ne 'bool' && $type ne 'int');
	}

	# get config
	my $wanted_file = "$git_dir/config";
	if (!defined $config_file || $config_file ne $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	my $full_key = "gitweb.$key";
	return unless exists $config{$full_key};

	# ensure given type
	return $config{$full_key} unless defined $type;
	if ($type eq 'bool') {
		# backward compatibility: 'git config --bool' returns true/false
		return config_to_bool($config{$full_key}) ? 'true' : 'false';
	}
	if ($type eq 'int') {
		return config_to_int($config{$full_key});
	}
	return $config{$full_key};
}
2810
# Get the hash of the entry at the given path in the given tree-ish.
# Arguments:
#   $base - tree-ish (ref) passed to "git ls-tree"
#   $path - path of the entry; trailing slashes are ignored
#   $type - optional object type ('blob', 'tree', ...) the entry must have
# Returns the hash, or undef if no path was given, git-ls-tree failed or
# printed nothing, its output could not be parsed, or the entry is of a
# different type than requested.  Calls die_error() if git-ls-tree cannot
# be started.
sub git_get_hash_by_path {
	my $base = shift;
	my $path = shift || return undef;
	my $type = shift;

	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
	# Take the captures from the match itself: after a failed match the
	# numbered capture variables would still hold values from some
	# earlier, unrelated match.
	my ($entry_type, $entry_hash) =
		$line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/
		or return undef;

	if (defined $type && $type ne $entry_type) {
		# type doesn't match
		return undef;
	}
	return $entry_hash;
}
2837
# Get the path of the first entry with the given hash in the given
# tree-ish (ref), searching the whole tree recursively.
# Used to get 'from' filename for combined diff (merge commit) for renames.
# Returns undef if there is no such entry or git-ls-tree cannot be
# started, and nothing if either argument is missing.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	# "git ls-tree -z" terminates each entry with NUL
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;

	my $found;
	while (defined(my $entry = <$fd>)) {
		chomp $entry;

		#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423	gitweb'
		#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f	gitweb/README'
		next unless ($entry =~ m/(?:[0-9]+) (?:.+) $hash\t(.+)$/);

		$found = $1;
		last;
	}
	close $fd;

	return $found;
}
2861
2862 ## ......................................................................
2863 ## git utility functions, directly accessing git repository
2864
# Get the value of a per-project setting $name for the project at $path.
# The first line of the file $GIT_DIR/$name is used if that file can be
# opened; otherwise the gitweb.$name variable from the repository config.
# Note that this sets the global $git_dir to the project's directory.
sub git_get_file_or_project_config {
	my ($path, $name) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open $fd, '<', "$git_dir/$name") {
		# no such file: fall back to the repository configuration
		return git_get_project_config($name);
	}
	my $conf = <$fd>;
	close $fd;

	chomp $conf if defined $conf;
	return $conf;
}
2881
# Return the description of the project at $path, taken from its
# 'description' file or the gitweb.description config variable.
sub git_get_project_description {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'description');
}
2886
# Return the category of the project at $path, taken from its
# 'category' file or the gitweb.category config variable.
sub git_get_project_category {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'category');
}
2891
2892
# Return a hash reference mapping the content tags ('ctags') of the given
# project to their weights.  Note that this sets the global $git_dir to
# the project's directory.
#
# supported formats:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
#
# Only the first of these sources that is available is used.
sub git_get_project_ctags {
	my $project = shift;
	my $ctags = {};

	$git_dir = "$projectroot/$project";
	if (opendir my $dh, "$git_dir/ctags") {
		my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
		foreach my $tagfile (@files) {
			open my $ct, '<', $tagfile
				or next;
			# only the first line matters; it is undef for an empty file
			my $val = <$ct>;
			chomp $val if defined $val;
			close $ct;

			# the tag name is the file name without its directory
			(my $ctag = $tagfile) =~ s#.*/##;
			if (defined $val && $val =~ /^\d+$/) {
				$ctags->{$ctag} = $val;
			} else {
				$ctags->{$ctag} = 1;
			}
		}
		closedir $dh;

	} elsif (open my $fh, '<', "$git_dir/ctags") {
		while (my $line = <$fh>) {
			chomp $line;
			$ctags->{$line}++ if $line;
		}
		close $fh;

	} else {
		my $taglist = config_to_multi(git_get_project_config('ctag'));
		foreach my $tag (@$taglist) {
			$ctags->{$tag}++;
		}
	}

	return $ctags;
}
2939
# Sum up the content tags ('ctags') of all given projects.
# $projects is a reference to an array of project hashes, each holding
# its tag weights under the 'ctags' key.  Returns a hash reference whose
# keys are the tags and whose values are the total weights.
sub git_gather_all_ctags {
	my ($projects) = @_;
	my %total;

	foreach my $proj (@$projects) {
		my @tags = keys %{$proj->{'ctags'}};
		$total{$_} += $proj->{'ctags'}->{$_} foreach @tags;
	}

	return \%total;
}
2954
# Build a tag cloud from a { tag => weight } hashref.
#
# Tags differing only in case are merged under their lowercased name; the
# spelling with the highest individual weight is used for display.
# Returns an HTML::TagCloud object when that module can be loaded, otherwise
# a plain hashref { lc_tag => { count => ..., ctag => <link html> } }.
# The tag equal to the 'ctag' input parameter is wrapped in a "match" span.
sub git_populate_project_tagcloud {
	my ($ctags) = @_;

	# First, merge different-cased tags; tags vote on casing
	my %merged;
	for my $tag (keys %$ctags) {
		my $weight = $ctags->{$tag};
		my $entry = ($merged{lc $tag} ||= {});
		$entry->{count} += $weight;
		if (!$entry->{topcount} || $entry->{topcount} < $weight) {
			$entry->{topcount} = $weight;
			$entry->{topname} = $tag;
		}
	}

	my $matched = $input_params{'ctag'};
	# highlight the currently selected tag, leave the others untouched
	my $mark_match = sub {
		my ($key, $title) = @_;
		return (defined $matched && $matched eq $key)
			? qq(<span class="match">$title</span>)
			: $title;
	};

	if (eval { require HTML::TagCloud; 1; }) {
		my $cloud = HTML::TagCloud->new;
		for my $key (sort keys %merged) {
			# Pad the title with spaces so that the cloud looks
			# less crammed.
			my $title = esc_html($merged{$key}{topname});
			$title =~ s/ /&nbsp;/g;
			$title =~ s/^/&nbsp;/g;
			$title =~ s/$/&nbsp;/g;
			$cloud->add($mark_match->($key, $title),
			            href(project=>undef, ctag=>$key),
			            $merged{$key}{count});
		}
		return $cloud;
	}

	my %cloud;
	for my $key (keys %merged) {
		my $title = esc_html($merged{$key}{topname}, -nbsp=>1);
		$title = $mark_match->($key, $title);
		$cloud{$key}{count} = $merged{$key}{count};
		$cloud{$key}{ctag} =
			$cgi->a({-href=>href(project=>undef, ctag=>$key)}, $title);
	}
	return \%cloud;
}
3000
# Render a tag cloud produced by git_populate_project_tagcloud() as HTML,
# limited to $count tags.
# An HTML::TagCloud object renders itself; the plain-hash fallback becomes a
# comma-separated list of links inside <div id="htmltagcloud">.
# NOTE(review): the fallback sorts ascending by count before truncating, so
# the lowest-weight tags are the ones kept -- confirm this is intended.
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;

	return $cloud->html_and_css($count)
		if ref $cloud eq 'HTML::TagCloud';

	my @by_count = sort { $cloud->{$a}{'count'} <=> $cloud->{$b}{'count'} } keys %$cloud;
	my @links = map { $cloud->{$_}{'ctag'} } splice(@by_count, 0, $count);
	# centered only when no project is selected
	my $align = $project ? '' : ' align="center"';

	return '<div id="htmltagcloud"' . $align . '>' . join(', ', @links) . '</div>';
}
3015
# Return the URLs of the project at $path: the lines of its 'cloneurl' file
# or, if that file cannot be opened, the multi-valued 'url' config variable.
# Returns a list in list context and an arrayref otherwise.
# Side effect: sets the global $git_dir to "$projectroot/$path".
sub git_get_project_url_list {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open $fd, '<', "$git_dir/cloneurl") {
		my $urls = config_to_multi(git_get_project_config('url'));
		return wantarray ? @$urls : $urls;
	}
	chomp(my @urls = <$fd>);
	close $fd;

	return wantarray ? @urls : \@urls;
}
3029
# Build the list of exportable projects as a list of hashes
# { path => ... } (plus 'owner' when the index file provides one).
#
# $projects_list is either a directory, which is scanned for repositories,
# or a file with one url-encoded "path owner" entry per line.
# $filter, if given, limits the result to paths below "$filter/".
# With $paranoid the directory scan starts at the top and filters each path
# afterwards instead of starting the scan inside the "$filter" subdirectory.
sub git_get_projects_list {
	my $filter = shift || '';
	my $paranoid = shift;
	my @list;

	if (-d $projects_list) {
		# search in directory
		my $dir = $projects_list;
		# remove the trailing "/"
		$dir =~ s!/+$!!;
		my $pfxlen = length("$dir");
		my $pfxdepth = ($dir =~ tr!/!!);
		# when filtering, search only given subdirectory
		if ($filter && !$paranoid) {
			$dir .= "/$filter";
			$dir =~ s!/+$!!;
		}

		File::Find::find({
			follow_fast => 1, # follow symbolic links
			follow_skip => 2, # ignore duplicates
			dangling_symlinks => 0, # ignore dangling symlinks, silently
			wanted => sub {
				# global variables
				our $project_maxdepth;
				our $projectroot;
				# skip project-list toplevel, if we get it.
				return if (m!^[/.]$!);
				# only directories can be git repositories
				return unless (-d $_);
				# don't traverse too deep (Find is super slow on os x)
				# $project_maxdepth excludes depth of $projectroot
				if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
					$File::Find::prune = 1;
					return;
				}

				my $path = substr($File::Find::name, $pfxlen + 1);
				# paranoidly only filter here
				if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
					# this is a callback, not a loop body: leave it with
					# 'return' ('next' would exit the subroutine via a
					# loop control and trigger a warning)
					return;
				}
				# we check related file in $projectroot
				if (check_export_ok("$projectroot/$path")) {
					push @list, { path => $path };
					$File::Find::prune = 1;
				}
			},
		}, "$dir");

	} elsif (-f $projects_list) {
		# read from file(url-encoded):
		# 'git%2Fgit.git Linus+Torvalds'
		# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
		# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
		open my $fd, '<', $projects_list or return;
	PROJECT:
		while (my $line = <$fd>) {
			chomp $line;
			my ($path, $owner) = split ' ', $line;
			$path = unescape($path);
			$owner = unescape($owner);
			if (!defined $path) {
				next PROJECT;
			}
			# if $filter is provided, check if $path begins with $filter
			if ($filter && $path !~ m!^\Q$filter\E/!) {
				next PROJECT;
			}
			if (check_export_ok("$projectroot/$path")) {
				my $pr = {
					path => $path
				};
				if ($owner) {
					$pr->{'owner'} = to_utf8($owner);
				}
				push @list, $pr;
			}
		}
		close $fd;
	}
	return @list;
}
3113
# Remove forks from a list of projects.
#
# A project is treated as a fork when its path lies below the directory
# named after another listed project ('repo/...' for 'repo.git' or 'repo'),
# provided that directory exists under $projectroot.
# Returns the list of non-fork projects.
#
# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
# as side effects it sets 'forks' field to list of forks for forked projects
sub filter_forks_from_projects_list {
	my ($projects) = @_;

	my %trie; # prefix tree of directories (path components)

	# generate trie out of those directories that might contain forks
	for my $base (@$projects) {
		my $path = $base->{'path'};
		$path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
		next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
		next unless ($path);      # skip '.git' repository: tests, git-instaweb
		next unless (-d "$projectroot/$path"); # containing directory exists
		$base->{'forks'} = [];    # there can be 0 or more forks of project

		# walk down the trie one path component at a time, creating
		# the nodes that are not there yet
		my $node = \%trie;
		for my $component (split('/', $path)) {
			$node = exists $node->{$component}
				? $node->{$component}
				: ($node->{$component} = {});
		}
		# create end marker, store the project as a data
		$node->{''} = $base unless exists $node->{''};
	}

	# filter out forks, by finding shortest prefix match for paths
	my @kept;
	for my $candidate (@$projects) {
		my $node = \%trie;
		my $parent; # project this candidate is a fork of, if any
		for my $component (split('/', $candidate->{'path'})) {
			if (exists $node->{''}) {
				# found [shortest] prefix, is a fork
				$parent = $node->{''};
				last;
			}
			# not in trie, cannot have prefix, not a fork
			last unless exists $node->{$component};
			# the component is there, walk one step down the trie
			$node = $node->{$component};
		}

		if (defined $parent) {
			push @{ $parent->{'forks'} }, $candidate;
		} else {
			# no prefix found, or ran out of path components
			push @kept, $candidate;
		}
	}

	return @kept;
}
3173
# Filter a project list by content tag and/or search regexp.
# Options: 'tagfilter' (tag name, compared case-insensitively) and
# 'search_regexp' (matched against 'path' and 'descr_long').
# Without either option the input list is returned unchanged.
#
# note: fill_project_list_info must be run first,
# for 'descr_long' and 'ctags' to be filled
sub search_projects_list {
	my ($projlist, %opts) = @_;
	my ($tagfilter, $search_re) = @opts{'tagfilter', 'search_regexp'};

	return @$projlist
		unless ($tagfilter || $search_re);

	# searching projects require filling to be run before it;
	my @wanted_info;
	push @wanted_info, 'ctags' if $tagfilter;
	push @wanted_info, 'path', 'descr' if $search_re;
	fill_project_list_info($projlist, @wanted_info);

	my @found;
	for my $pr (@$projlist) {
		if ($tagfilter) {
			my $tags = $pr->{'ctags'};
			next unless ref($tags) eq 'HASH';
			next unless
				grep { lc($_) eq lc($tagfilter) } keys %$tags;
		}

		next if $search_re
			&& $pr->{'path'} !~ /$search_re/
			&& $pr->{'descr_long'} !~ /$search_re/;

		push @found, $pr;
	}

	return @found;
}
3209
# Cache of project owners taken from the $projects_list index file:
# hashref { project path => owner }, undef until the file has been consulted.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from $projects_list, if that is a plain file.
# Does nothing when the cache is already defined.
sub git_get_project_list_from_file {

	return if (defined $gitweb_project_owner);

	$gitweb_project_owner = {};
	# read from file (url-encoded):
	# 'git%2Fgit.git Linus+Torvalds'
	# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
	# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
	if (-f $projects_list) {
		# an unreadable index simply leaves the cache empty
		open(my $fd, '<', $projects_list)
			or return;
		while (my $line = <$fd>) {
			chomp $line;
			my ($pr, $ow) = split ' ', $line;
			# blank lines carry no project path; do not use undef as key
			next unless defined $pr;
			$pr = unescape($pr);
			$ow = unescape($ow);
			$gitweb_project_owner->{$pr} = to_utf8($ow);
		}
		close $fd;
	}
}
3232
# Return the owner of $project, taken from the first source that defines it:
# the projects index file cache, the 'owner' config variable, or the owner
# of the repository directory on disk. Returns undef without a project.
# Side effect: sets the global $git_dir to "$projectroot/$project".
sub git_get_project_owner {
	my ($project) = @_;

	return undef unless $project;
	$git_dir = "$projectroot/$project";

	git_get_project_list_from_file()
		unless defined $gitweb_project_owner;

	my $owner;
	$owner = $gitweb_project_owner->{$project}
		if exists $gitweb_project_owner->{$project};
	$owner = git_get_project_config('owner')
		unless defined $owner;
	$owner = get_file_owner("$git_dir")
		unless defined $owner;

	return $owner;
}
3256
# Find the most recent committer timestamp among the branch refs of the
# project at $path.
# Returns ($age_in_seconds, $age_string), or (undef, undef) when no
# timestamp could be parsed from the output. Returns nothing when the
# command cannot be started or closing the pipe fails.
# Side effect: sets the global $git_dir to "$projectroot/$path".
sub git_get_last_activity {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";
	my @cmd = (git_cmd(), 'for-each-ref',
	           '--format=%(committer)',
	           '--sort=-committerdate',
	           '--count=1',
	           map { "refs/$_" } get_branch_refs ());
	open(my $fd, "-|", @cmd) or return;
	my $most_recent = <$fd>;
	close $fd or return;

	return (undef, undef)
		unless defined $most_recent &&
		       $most_recent =~ / (\d+) [-+][01]\d\d\d$/;

	my $age = time - $1;
	return ($age, age_string($age));
}
3277
# Return the remotes of the current repository, read from 'git remote -v',
# as a hash (hashref in scalar context):
#   remote name => { 'heads' => undef, <key> => <url>, ... }
# where <key> is the word printed in parentheses after each URL.
# If $wanted is given, only that remote is reported.
# Returns nothing if the command cannot be started or exits unsuccessfully.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always work (assuming it's a remote URL
# if it's not defined), and we cannot use 'git remote show' because that would
# try to make a network roundtrip. So the only way to find if that particular
# remote is defined is to walk the list provided by 'git remote -v' and stop if
# and when we find what we want.
sub git_get_remotes_list {
	my $wanted = shift;
	my %remotes = ();

	# check open() itself: the lexical handle is autovivified even when
	# open fails, so testing $fd afterwards does not detect failure
	open my $fd, '-|' , git_cmd(), 'remote', '-v'
		or return;
	while (my $remote = <$fd>) {
		chomp $remote;
		# take URL and key from this line only; a line that does not
		# match must not pick up captures of an earlier match
		my ($url, $key);
		if ($remote =~ s!\t(.*?)\s+\((\w+)\)$!!) {
			($url, $key) = ($1, $2);
		}
		next if $wanted and not $remote eq $wanted;

		# 'heads' stays undefined here; fill_remote_heads() sets it
		$remotes{$remote} ||= { 'heads' => undef };
		$remotes{$remote}{$key} = $url if defined $key;
	}
	close $fd or return;
	return wantarray ? %remotes : \%remotes;
}
3302
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
# Each remote gets 'heads' set to an arrayref of the head records whose
# name starts with "<remote>/"; that prefix is stripped from the record's
# 'name' in place.
sub fill_remote_heads {
	my $remotes = shift;
	my @heads = map { "remotes/$_" } keys %$remotes;
	my @remoteheads = git_get_heads_list(undef, @heads);
	foreach my $remote (keys %$remotes) {
		# \Q...\E: the remote name is literal text, not a pattern
		$remotes->{$remote}{'heads'} = [ grep {
			$_->{'name'} =~ s!^\Q$remote\E/!!
			} @remoteheads ];
	}
}
3315
# Map object ids to ref names using 'git show-ref --dereference'.
# $type (e.g. "heads" or "tags"; optional) limits the refs to "refs/$type".
# Returns a hashref { sha1 => [ ref names without the "refs/" prefix ] },
# or nothing if the command cannot be started or exits unsuccessfully.
sub git_get_references {
	my $type = shift || "";
	my %refs;
	# 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
	# c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
	open my $fd, "-|", git_cmd(), "show-ref", "--dereference",
		($type ? ("--", "refs/$type") : ()) # use -- <pattern> if $type
		or return;

	while (my $line = <$fd>) {
		chomp $line;
		# $type is a literal ref prefix, so quote it inside the pattern
		if ($line =~ m!^([0-9a-fA-F]{40})\srefs/(\Q$type\E.*)$!) {
			push @{ $refs{$1} }, $2;
		}
	}
	close $fd or return;
	return \%refs;
}
3338
# Return the tag-based name of $hash as reported by 'git name-rev --tags'
# (the part after "tags/"), or undef if there is none.
sub git_get_rev_name_tags {
	my $hash = shift || return undef;

	open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
		or return;
	my $name_rev = <$fd>;
	close $fd;

	# no output at all leaves $name_rev undefined
	if (defined $name_rev && $name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
		return $1;
	} else {
		# catches also '$hash undefined' output
		return undef;
	}
}
3354
3355 ## ----------------------------------------------------------------------
3356 ## parse to hash functions
3357
# Break an epoch timestamp into display fields.
# $epoch is seconds since the epoch; $tz is a "+hhmm"/"-hhmm" offset
# (default "-0000") used for the *_local and 'iso-tz' fields.
# Returns a hash with keys: hour, minute, mday, day, month, rfc2822,
# mday-time, iso-8601 (all UTC), hour_local, minute_local, tz_local, iso-tz.
sub parse_date {
	my $epoch = shift;
	my $tz = shift || "-0000";

	my %date;
	my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
	my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
	$date{'hour'} = $hour;
	$date{'minute'} = $min;
	$date{'mday'} = $mday;
	$date{'day'} = $days[$wday];
	$date{'month'} = $months[$mon];
	$date{'rfc2822'} = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
	                   $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
	$date{'mday-time'} = sprintf "%d %s %02d:%02d",
	                     $mday, $months[$mon], $hour ,$min;
	$date{'iso-8601'} = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
	                    1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

	# offset of $tz from UTC in seconds; a malformed $tz counts as UTC
	# instead of feeding undefined captures into the arithmetic
	my $tz_offset = 0;
	if ($tz =~ m/^([-+])(\d\d)(\d\d)$/) {
		my $tz_sign = ($1 eq '-' ? -1 : +1);
		$tz_offset = $tz_sign*((($2*60) + $3)*60);
	}
	my $local = $epoch + $tz_offset;
	($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
	$date{'hour_local'} = $hour;
	$date{'minute_local'} = $min;
	$date{'tz_local'} = $tz;
	$date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
	                          1900+$year, $mon+1, $mday,
	                          $hour, $min, $sec, $tz);
	return %date;
}
3391
# Parse the tag object $tag_id (output of 'git cat-file tag') into a hash.
# Keys: id, object, type, name, author, author_epoch, author_tz,
# author_name, author_email (only when the tagger has an <email> part) and
# comment (arrayref of the lines following the header).
# Returns nothing if the command cannot be started, if closing the pipe
# fails, or if no "tag <name>" header line was seen.
sub parse_tag {
	my ($tag_id) = @_;
	my (%tag, @comment);

	open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
	$tag{'id'} = $tag_id;

HEADER:
	while (my $line = <$fd>) {
		chomp $line;

		if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
			$tag{'object'} = $1;
			next HEADER;
		}
		if ($line =~ m/^type (.+)$/) {
			$tag{'type'} = $1;
			next HEADER;
		}
		if ($line =~ m/^tag (.+)$/) {
			$tag{'name'} = $1;
			next HEADER;
		}
		if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
			@tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
			if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				@tag{'author_name', 'author_email'} = ($1, $2);
			} else {
				$tag{'author_name'} = $tag{'author'};
			}
			next HEADER;
		}
		if ($line =~ m/--BEGIN/) {
			# this line already belongs to the comment
			push @comment, $line;
			last HEADER;
		}
		# an empty line ends the header
		last HEADER if $line eq "";
	}

	# everything that is left is the tag message
	push @comment, <$fd>;
	$tag{'comment'} = \@comment;
	close $fd or return;

	return unless defined $tag{'name'};
	return %tag
}
3432
# Parse one record of 'git rev-list --header' output into a commit hash.
#
# $commit_text is the record including its trailing "\0" line.
# When $withparents is defined, parents are taken from the first line only
# (as printed with --parents); otherwise "parent" header lines are used too.
# Keys: id, tree, parents, parent, author*, committer* (each with _epoch,
# _tz, _name and, when present, _email), title, title_short, comment, age,
# age_string, age_string_date, age_string_age.
# Returns nothing for empty input, a first line not starting with 40 hex
# digits, or a record without a "tree" line.
sub parse_commit_text {
	my ($commit_text, $withparents) = @_;
	my @commit_lines = split '\n', $commit_text;
	my %co;

	pop @commit_lines; # Remove '\0'
	return unless @commit_lines;

	my $header = shift @commit_lines;
	return unless $header =~ m/^[0-9a-fA-F]{40}/;
	my ($id, @parents) = split ' ', $header;
	$co{'id'} = $id;

	# header lines, up to the first empty line
	while (my $line = shift @commit_lines) {
		last if $line eq "\n";
		if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
			$co{'tree'} = $1;
		} elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
			push @parents, $1;
		} elsif ($line =~ m/^(author|committer) (.*) ([0-9]+) (.*)$/) {
			my ($role, $ident, $epoch, $tz) = ($1, $2, $3, $4);
			$co{$role} = to_utf8($ident);
			$co{$role . '_epoch'} = $epoch;
			$co{$role . '_tz'} = $tz;
			if ($co{$role} =~ m/^([^<]+) <([^>]*)>/) {
				$co{$role . '_name'} = $1;
				$co{$role . '_email'} = $2;
			} else {
				$co{$role . '_name'} = $co{$role};
			}
		}
	}
	return unless defined $co{'tree'};

	$co{'parents'} = \@parents;
	$co{'parent'} = $parents[0];

	# the first non-empty message line is the title; note that the loop
	# variable aliases the element of @commit_lines, so the edits below
	# also change that line of the stored comment
	foreach my $title (@commit_lines) {
		$title =~ s/^ //;
		next if $title eq "";

		$co{'title'} = chop_str($title, 80, 5);
		# remove leading stuff of merges to make the interesting part visible
		if (length($title) > 50) {
			$title =~ s/^Automatic //;
			$title =~ s/^merge (of|with) /Merge ... /i;
			$title =~ s/(http|rsync):\/\/// if length($title) > 50;
			$title =~ s/(master|www|rsync)\.// if length($title) > 50;
			$title =~ s/kernel.org:?// if length($title) > 50;
			$title =~ s/\/pub\/scm// if length($title) > 50;
		}
		$co{'title_short'} = chop_str($title, 50, 5);
		last;
	}
	if (! defined $co{'title'} || $co{'title'} eq "") {
		$co{'title'} = $co{'title_short'} = '(no commit message)';
	}
	# remove added spaces
	s/^ // for @commit_lines;
	$co{'comment'} = \@commit_lines;

	my $age = time - $co{'committer_epoch'};
	$co{'age'} = $age;
	$co{'age_string'} = age_string($age);
	my ($mday, $mon, $year) = (gmtime($co{'committer_epoch'}))[3, 4, 5];
	my $date_str = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
	# commits older than two weeks show the date first, recent ones the age
	@co{'age_string_date', 'age_string_age'} = ($age > 60*60*24*7*2)
		? ($date_str, $co{'age_string'})
		: ($co{'age_string'}, $date_str);

	return %co;
}
3530
# Parse the single commit $commit_id via 'git rev-list --parents --header'.
# Returns the hash produced by parse_commit_text(); reports a 500 error
# through die_error() if the command cannot be started.
sub parse_commit {
	my ($commit_id) = @_;

	# rev-list --header separates records with NUL
	local $/ = "\0";

	my @cmd = (git_cmd(), "rev-list",
		"--parents",
		"--header",
		"--max-count=1",
		$commit_id,
		"--");
	open my $fd, "-|", @cmd
		or die_error(500, "Open git-rev-list failed");
	my %co = parse_commit_text(<$fd>, 1);
	close $fd;

	return %co;
}
3549
# Parse up to $maxcount (default 1) commits reachable from $commit_id,
# skipping the first $skip (default 0), optionally limited to $filename.
# @args are passed to 'git rev-list' as additional options.
# Returns a list of commit hashrefs (arrayref in scalar context); reports a
# 500 error through die_error() if the command cannot be started.
sub parse_commits {
	my ($commit_id, $maxcount, $skip, $filename, @args) = @_;
	my @cos;

	$maxcount ||= 1;
	$skip ||= 0;

	# rev-list --header separates records with NUL
	local $/ = "\0";

	my @cmd = (git_cmd(), "rev-list",
		"--header",
		@args,
		"--max-count=$maxcount",
		"--skip=$skip",
		@extra_options,
		$commit_id,
		"--");
	push @cmd, $filename if $filename;

	open my $fd, "-|", @cmd
		or die_error(500, "Open git-rev-list failed");
	while (my $record = <$fd>) {
		push @cos, +{ parse_commit_text($record) };
	}
	close $fd;

	return wantarray ? @cos : \@cos;
}
3577
# parse line of git-diff-tree "raw" output
# Recognizes three kinds of lines: an ordinary diff entry, a combined diff
# entry (for merge commits) and a bare commit id. Anything else yields an
# empty result. Returns a hash (hashref in scalar context).
sub parse_difftree_raw_line {
	my ($line) = @_;
	my %res;

	# ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M ls-files.c'
	# ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M rev-tree.c'
	if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
		@res{'from_mode', 'to_mode', 'from_id', 'to_id', 'status', 'similarity'} =
			($1, $2, $3, $4, $5, $6);
		my $paths = $7;
		if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
			($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $paths);
		} else {
			$res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($paths);
		}
	}
	# '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
	# combined diff (for merge commit)
	elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
		my ($colons, $modes, $ids, $status, $file) = ($1, $2, $3, $4, $5);
		# the last mode and the last id describe the result,
		# the preceding ones the parents
		my @modes = split(' ', $modes);
		my @ids = split(' ', $ids);
		$res{'nparents'} = length($colons);
		$res{'to_mode'} = pop @modes;
		$res{'from_mode'} = \@modes;
		$res{'to_id'} = pop @ids;
		$res{'from_id'} = \@ids;
		$res{'status'} = [ split('', $status) ];
		$res{'to_file'} = unquote($file);
	}
	# 'c512b523472485aef4fff9e57b229d9d243c967f'
	elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
		$res{'commit'} = $1;
	}

	return wantarray ? %res : \%res;
}
3616
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
# A hashref is taken to be pre-parsed (or generated by hand) and is returned
# as is; anything else is handed to parse_difftree_raw_line().
sub parsed_difftree_line {
	my ($line_or_ref) = @_;

	return ref($line_or_ref) eq "HASH"
		? $line_or_ref
		: parse_difftree_raw_line($line_or_ref);
}
3629
# parse line of git-ls-tree output
# Options: '-l' => the line has a size column ('git ls-tree -l'),
#          '-z' => the name is taken verbatim instead of being unquoted.
# Returns a hash (hashref in scalar context) with keys mode, type, hash,
# name and, with '-l', size. A line that does not have the expected format
# yields an empty result.
sub parse_ls_tree_line {
	my $line = shift;
	my %opts = @_;
	my %res;
	my $name;

	if ($opts{'-l'}) {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa 16717 panic.c'
		# use the captures only if this match succeeded; otherwise they
		# still hold the values of some earlier, unrelated match
		$line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s
			or return wantarray ? () : {};

		$res{'mode'} = $1;
		$res{'type'} = $2;
		$res{'hash'} = $3;
		$res{'size'} = $4;
		$name = $5;
	} else {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa panic.c'
		$line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s
			or return wantarray ? () : {};

		$res{'mode'} = $1;
		$res{'type'} = $2;
		$res{'hash'} = $3;
		$name = $4;
	}
	$res{'name'} = $opts{'-z'} ? $name : unquote($name);

	return wantarray ? %res : \%res;
}
3665
# generates _two_ hashes, references to which are passed as 2 and 3 argument
# $from and $to get 'file' and 'href' (a link to the blob view) for the
# pre-image and the post-image of $diffinfo. For a combined diff, $from's
# 'file' and 'href' are arrayrefs with one entry per parent in @parents.
# 'href' is absent (or undef, per parent) where the file does not exist on
# that side. Uses the globals $hash and $hash_parent as base for the links.
sub parse_from_to_diffinfo {
	my ($diffinfo, $from, $to, @parents) = @_;

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$from->{'file'} = [];
		$from->{'href'} = [];
		fill_from_file_info($diffinfo, @parents)
			unless exists $diffinfo->{'from_file'};
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $parent_file = $diffinfo->{'from_file'}[$i];
			$from->{'file'}[$i] = defined $parent_file
				? $parent_file
				: $diffinfo->{'to_file'};
			# no link for a file that is new (added) relative to this parent
			$from->{'href'}[$i] = ($diffinfo->{'status'}[$i] ne "A")
				? href(action=>"blob",
				       hash_base=>$parents[$i],
				       hash=>$diffinfo->{'from_id'}[$i],
				       file_name=>$from->{'file'}[$i])
				: undef;
		}
	} else {
		# ordinary (not combined) diff
		$from->{'file'} = $diffinfo->{'from_file'};
		if ($diffinfo->{'status'} eq "A") { # new (added) file
			delete $from->{'href'};
		} else {
			$from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
			                       hash=>$diffinfo->{'from_id'},
			                       file_name=>$from->{'file'});
		}
	}

	$to->{'file'} = $diffinfo->{'to_file'};
	if (is_deleted($diffinfo)) {
		delete $to->{'href'};
	} else { # file exists in result
		$to->{'href'} = href(action=>"blob", hash_base=>$hash,
		                     hash=>$diffinfo->{'to_id'},
		                     file_name=>$to->{'file'});
	}
}
3711
3712 ## ......................................................................
3713 ## parse to array of hashes functions
3714
# List heads, most recently committed first, using 'git for-each-ref'.
# $limit, if true, asks for at most $limit+1 refs; @classes are ref
# namespaces below "refs/" (default: get_branch_refs()).
# Returns a list (arrayref in scalar context) of hashrefs with keys
# fullname, name, id, title, epoch and age, or nothing if the command
# cannot be started.
sub git_get_heads_list {
	my ($limit, @classes) = @_;
	@classes = get_branch_refs() unless @classes;
	my @patterns = map { "refs/$_" } @classes;
	my @headslist;

	# alternation of the branch ref namespaces; the same for every line
	my $strip_refs = join '|', map { quotemeta } get_branch_refs();

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
		'--format=%(objectname) %(refname) %(subject)%00%(committer)',
		@patterns
		or return;
	while (my $line = <$fd>) {
		my %ref_item;

		chomp $line;
		my ($refinfo, $committerinfo) = split(/\0/, $line);
		my ($hash, $name, $title) = split(' ', $refinfo, 3);
		# split drops a trailing empty field, so there may be no
		# committer part to match against
		$committerinfo = '' unless defined $committerinfo;
		my ($committer, $epoch, $tz) =
			($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);
		$ref_item{'fullname'} = $name;
		# for refs neither in 'heads' nor 'remotes' we want to
		# show their ref dir; take it from this substitution only,
		# otherwise $1 would still hold the committer matched above
		my $ref_dir = '';
		if ($name =~ s!^refs/($strip_refs|remotes)/!!) {
			$ref_dir = $1;
		}
		$ref_item{'name'} = $name;
		if ($ref_dir ne '' and $ref_dir ne 'heads' and $ref_dir ne 'remotes') {
			$ref_item{'name'} .= ' (' . $ref_dir . ')';
		}

		$ref_item{'id'} = $hash;
		$ref_item{'title'} = $title || '(no commit message)';
		$ref_item{'epoch'} = $epoch;
		if ($epoch) {
			$ref_item{'age'} = age_string(time - $ref_item{'epoch'});
		} else {
			$ref_item{'age'} = "unknown";
		}

		push @headslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @headslist : \@headslist;
}
3760
# List tags, most recently created first, using 'git for-each-ref'.
# $limit, if true, asks for at most $limit+1 refs.
# Returns a list (arrayref in scalar context) of hashrefs with keys
# fullname, name, type, id, reftype, refid, plus subject for tag objects
# and epoch/age for tags and commits; returns nothing if the command cannot
# be started.
sub git_get_tags_list {
	my $limit = shift;
	my @tagslist;

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
		'--format=%(objectname) %(objecttype) %(refname) '.
		'%(*objectname) %(*objecttype) %(subject)%00%(creator)',
		'refs/tags'
		or return;
	while (my $line = <$fd>) {
		my %ref_item;

		chomp $line;
		my ($refinfo, $creatorinfo) = split(/\0/, $line);
		my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
		# split drops a trailing empty field, so a ref without creator
		# text leaves $creatorinfo undefined
		$creatorinfo = '' unless defined $creatorinfo;
		my ($creator, $epoch, $tz) =
			($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
		$ref_item{'fullname'} = $name;
		$name =~ s!^refs/tags/!!;

		$ref_item{'type'} = $type;
		$ref_item{'id'} = $id;
		$ref_item{'name'} = $name;
		if ($type eq "tag") {
			$ref_item{'subject'} = $title;
			$ref_item{'reftype'} = $reftype;
			$ref_item{'refid'} = $refid;
		} else {
			$ref_item{'reftype'} = $type;
			$ref_item{'refid'} = $id;
		}

		if ($type eq "tag" || $type eq "commit") {
			$ref_item{'epoch'} = $epoch;
			if ($epoch) {
				$ref_item{'age'} = age_string(time - $ref_item{'epoch'});
			} else {
				$ref_item{'age'} = "unknown";
			}
		}

		push @tagslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @tagslist : \@tagslist;
}
3809
3810 ## ----------------------------------------------------------------------
3811 ## filesystem-related functions
3812
# Return the name of the owner of $path: the GECOS field of the owning
# user's passwd entry, cut at the first ',' or ';'.
# Returns undef if $path cannot be stat'ed or the user has no GECOS field.
sub get_file_owner {
	my $path = shift;

	my $st_uid = (stat($path))[4];
	# stat failed: do not pass undef on to getpwuid, which would take it
	# as uid 0 and report that user's name
	return undef unless defined $st_uid;

	my $gcos = (getpwuid($st_uid))[6];
	if (!defined $gcos) {
		return undef;
	}
	my $owner = $gcos;
	$owner =~ s/[,;].*$//;
	return to_utf8($owner);
}
3825
# Print the contents of $filename to the currently selected output handle,
# passing each line through to_utf8().
# The file is assumed to exist; if it cannot be opened nothing is printed.
sub insert_file {
	my $filename = shift;

	open my $fd, '<', $filename
		or return;
	print map { to_utf8($_) } <$fd>;
	close $fd;
}
3834
3835 ## ......................................................................
3836 ## mimetype related functions
3837
# Look up the MIME type of $filename by its extension in the map file
# $mimemap, whose lines have the form "mime/type ext1 ext2 ..." (lines
# starting with '#' are comments).
# Returns undef if the map is not readable, the file name has no extension,
# or the extension is not listed.
sub mimetype_guess_file {
	my $filename = shift;
	my $mimemap = shift;
	-r $mimemap or return undef;

	# without an extension there is nothing to look up; checking the match
	# also keeps a stale $1 from being used as the key
	my ($ext) = $filename =~ /\.([^.]*)$/
		or return undef;

	my %mimemap;
	open(my $mh, '<', $mimemap) or return undef;
	while (<$mh>) {
		next if m/^#/; # skip comments
		my ($mimetype, @exts) = split(/\s+/);
		foreach my $map_ext (@exts) {
			$mimemap{$map_ext} = $mimetype;
		}
	}
	close($mh);

	return $mimemap{$ext};
}
3857
# Guess the MIME type of $filename from its extension: first from the
# configured $mimetypes_file (a relative path is taken relative to the
# current project), then from /etc/mime.types.
# Returns undef for a file name without a dot or when nothing matches.
sub mimetype_guess {
	my ($filename) = @_;
	return undef unless $filename =~ /\./;

	my $mime;
	if ($mimetypes_file) {
		# if it is relative path, it is relative to project
		my $file = ($mimetypes_file =~ m!^/!)
			? $mimetypes_file
			: "$projectroot/$project/$mimetypes_file";
		$mime = mimetype_guess_file($filename, $file);
	}
	$mime ||= mimetype_guess_file($filename, '/etc/mime.types');
	return $mime;
}
3874
# Determine the MIME type of a blob.
# The type guessed from $filename wins; without a handle the configured
# default is used; otherwise content that tests as text (-T) is
# 'text/plain', a few image extensions map to their image types, and
# everything else is 'application/octet-stream'.
sub blob_mimetype {
	my ($fd, $filename) = @_;

	if ($filename) {
		my $guessed = mimetype_guess($filename);
		return $guessed if $guessed;
	}

	# just in case
	return $default_blob_plain_mimetype unless $fd;

	return 'text/plain' if -T $fd;
	return 'application/octet-stream' unless $filename;
	return 'image/png' if $filename =~ m/\.png$/i;
	return 'image/gif' if $filename =~ m/\.gif$/i;
	return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
	return 'application/octet-stream';
}
3901
# Return the Content-Type value for a blob: $type if given, otherwise the
# result of blob_mimetype(). For 'text/plain' the configured default
# charset, if any, is appended.
sub blob_contenttype {
	my ($fd, $file_name, $type) = @_;

	$type = blob_mimetype($fd, $file_name) unless $type;

	return $type
		unless $type eq 'text/plain' && defined $default_text_plain_charset;
	return $type . "; charset=$default_text_plain_charset";
}
3912
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# The base name (with a trailing '.in' removed) is looked up in
# %highlight_basename first, then its extension in %highlight_ext.
sub guess_file_syntax {
	my ($highlight, $mimetype, $file_name) = @_;
	return undef unless ($highlight && defined $file_name);
	my $basename = basename($file_name, '.in');
	return $highlight_basename{$basename}
		if exists $highlight_basename{$basename};

	# take the extension from this match only: reading $1 after a failed
	# match would pick up the capture of some earlier, unrelated match
	my ($ext) = $basename =~ /\.([^.]*)$/;
	return undef unless $ext;
	return $highlight_ext{$ext}
		if exists $highlight_ext{$ext};

	return undef;
}
3929
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# The original handle is closed and reopened on a shell pipeline that feeds
# the blob named by the global $hash to the highlighter.
# NOTE(review): $syntax is put on the shell command line unquoted -- confirm
# it can only come from trusted configuration.
sub run_highlighter {
	my ($fd, $highlight, $syntax) = @_;
	return $fd unless ($highlight && defined $syntax);

	close $fd;
	my $pipeline =
		quote_command(git_cmd(), "cat-file", "blob", $hash)." | ".
		quote_command($highlight_bin).
		" --replace-tabs=8 --fragment --syntax $syntax |";
	open $fd, $pipeline
		or die_error(500, "Couldn't open file or run syntax highlighter");
	return $fd;
}
3943
3944 ## ======================================================================
3945 ## functions printing HTML: header, footer, error page
3946
# Compose the page title from the site name and, as far as they are
# defined, the project filter or the project, action and file name.
sub get_page_title {
	my $title = to_utf8($site_name);

	if (!defined $project) {
		$title .= " - projects in '" . esc_path($project_filter) . "'"
			if defined $project_filter;
		return $title;
	}
	$title .= " - " . to_utf8($project);

	if (defined $action) {
		$title .= "/$action"; # $action is US-ASCII (7bit ASCII)

		if (defined $file_name) {
			$title .= " - " . esc_path($file_name);
			# make the name of a tree end with a slash
			$title .= "/"
				if $action eq "tree" && $file_name !~ m|/$|;
		}
	}

	return $title;
}
3969
# Choose the content type for HTML pages.
sub get_content_type_html {
	# require explicit support from the UA if we are to send the page as
	# 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
	# we have to do this because MSIE sometimes globs '*/*', pretending to
	# support xhtml+xml but choking when it gets what it asked for.
	my $accept = $cgi->http('HTTP_ACCEPT');
	my $wants_xhtml =
		defined $accept &&
		$accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
		$cgi->Accept('application/xhtml+xml') != 0;

	return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3983
# Print the <link rel="alternate"> elements for the page header.
# With a project selected: an RSS and an Atom feed link, each in a plain
# and a "--no-merges" variant. Otherwise: links to the plain-text projects
# index and to the OPML list of project feeds.
sub print_feed_meta {
	if (defined $project) {
		my %href_params = get_feed_info();
		$href_params{'-title'} = 'log'
			unless exists $href_params{'-title'};

		foreach my $format (qw(RSS Atom)) {
			my $type = lc($format);
			my $title = esc_attr("$project - $href_params{'-title'} - $format feed");
			$href_params{'action'} = $type;

			# [ extra_options value, suffix appended to the title ]
			foreach my $variant ([ undef, '' ], [ '--no-merges', ' (no merges)' ]) {
				my ($extra_options, $suffix) = @$variant;
				$href_params{'extra_options'} = $extra_options;
				my $href = href(%href_params);
				print "<link ".
				      "rel=\"alternate\" ".
				      "title=\"$title$suffix\" ".
				      "href=\"$href\" ".
				      "type=\"application/$type+xml\" ".
				      "/>\n";
			}
		}

	} else {
		my $site = esc_attr($site_name);
		printf('<link rel="alternate" title="%s projects list" '.
		       'href="%s" type="text/plain; charset=utf-8" />'."\n",
		       $site, href(project=>undef, action=>"project_index"));
		printf('<link rel="alternate" title="%s projects feeds" '.
		       'href="%s" type="text/x-opml" />'."\n",
		       $site, href(project=>undef, action=>"opml"));
	}
}
4029
# Print the <link> elements that belong in the page <head>:
# stylesheets, feed links and the favicon.
#
# Parameter: the HTTP status string of the response; the feed links
# are printed only when it is exactly '200 OK'.
sub print_header_links {
	my $status = shift;

	# a $stylesheet defined in a config file takes precedence over the
	# @stylesheets list (backwards compatibility); entries of the list
	# that are false are left out
	my @css_urls = defined $stylesheet
		? ($stylesheet)
		: grep { $_ } @stylesheets;
	foreach my $css_url (@css_urls) {
		print '<link rel="stylesheet" type="text/css" href="'.esc_url($css_url).'"/>'."\n";
	}

	if ($status eq '200 OK') {
		print_feed_meta();
	}

	print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n)
		if (defined $favicon);
}
4049
# Print one breadcrumb link per directory component.
#
# Parameters: the list of path components, outermost first.
# Each component is printed as a link to the projects list filtered by
# the path accumulated so far, followed by " / ".
#
# The components are iterated as a list rather than tested for truth,
# so a directory literally named "0" gets its breadcrumb and does not
# cut the trail short.  Undefined or empty components are skipped.
sub print_nav_breadcrumbs_path {
	my $dirprefix = undef;
	foreach my $part (@_) {
		next unless (defined $part && length $part);

		$dirprefix .= "/" if defined $dirprefix;
		$dirprefix .= $part;
		print $cgi->a({-href => href(project => undef,
		                             project_filter => $dirprefix,
		                             action => "project_list")},
		              esc_html($part)) . " / ";
	}
}
4061
# Print the navigation breadcrumbs of the page header.
#
# Parameters (named):
#   -action_extra => text printed as the last breadcrumb; when it is
#                    given, the current action is printed as a link
#
# The trail starts with @extra_breadcrumbs and the home link.  It is
# followed either by the project path, project name and action, or,
# when no project is selected, by the project filter path.
sub print_nav_breadcrumbs {
	my %opts = @_;

	foreach my $crumb (@extra_breadcrumbs, [ $home_link_str => $home_link ]) {
		# the label ($crumb->[0]) is printed as is, without escaping
		print $cgi->a({-href => esc_url($crumb->[1])}, $crumb->[0]) . " / ";
	}

	if (defined $project) {
		# directories leading to the project, then the project itself
		my @path = split '/', $project;
		my $basename = pop @path;
		print_nav_breadcrumbs_path(@path);
		print $cgi->a({-href => href(action=>"summary")}, esc_html($basename));

		my $extra = $opts{-action_extra};
		if (defined $action) {
			my $action_print = defined $extra
				? $cgi->a({-href => href(action=>$action)}, $action)
				: $action;
			print " / $action_print";
		}
		print " / $extra"
			if (defined $extra);
		print "\n";
	} elsif (defined $project_filter) {
		print_nav_breadcrumbs_path(split '/', $project_filter);
	}
}
4089
# Print the search form of a project page.
#
# The form submits with the GET method to the 'search' action.  The
# revision to search from is $hash_base, else $hash, else "HEAD".
# With the 'pathinfo' feature enabled the project is part of the form
# action URL; otherwise it is sent as the hidden 'p' field.
# Note that an undefined global $searchtext is set to "" here.
sub print_search_form {
	$searchtext = ""
		unless (defined $searchtext);

	my $search_hash = defined $hash_base ? $hash_base
	                : defined $hash      ? $hash
	                :                      "HEAD";

	my $action = $my_uri;
	my $use_pathinfo = gitweb_check_feature('pathinfo');
	$action .= "/".esc_url($project)
		if ($use_pathinfo);

	# the project is passed as a hidden field only when it is not
	# already encoded in the action URL
	my $project_input = $use_pathinfo
		? ""
		: $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n";

	print $cgi->start_form(-method => "get", -action => $action) .
	      "<div class=\"search\">\n" .
	      $project_input .
	      $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
	      $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
	      $cgi->popup_menu(-name => 'st', -default => 'commit',
	                       -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
	      " " . $cgi->a({-href => href(action=>"search_help"),
	                     -title => "search help" }, "?") . " search:\n",
	      $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n" .
	      "<span title=\"Extended regular expression\">" .
	      $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
	                     -checked => $search_use_regexp) .
	      "</span>" .
	      "</div>" .
	      $cgi->end_form() . "\n";
}
4125
# Print the HTTP header and the top of the HTML page.
#
# Parameters:
#   $status  - HTTP status string; a false value means "200 OK"
#   $expires - value for the -expires field of the HTTP header
#   %opts    - named options:
#                '-no_http_header' => true suppresses the HTTP header
#              all options are also passed on to print_nav_breadcrumbs()
#
# The output covers the XML prolog, the <head> section, the optional
# site header file, the page header with logo and breadcrumbs, and,
# for project pages with the 'search' feature enabled, the search form.
sub git_header_html {
	my ($status, $expires, %opts) = @_;
	$status ||= "200 OK";

	my $title = get_page_title();
	my $content_type = get_content_type_html();
	if (!$opts{'-no_http_header'}) {
		print $cgi->header(-type=>$content_type, -charset => 'utf-8',
		                   -status=> $status, -expires => $expires);
	}

	my $mod_perl_version = '';
	$mod_perl_version = " $ENV{'MOD_PERL'}"
		if ($ENV{'MOD_PERL'});
	print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
	# relative URLs (stylesheet, favicon, ...) do not resolve correctly
	# under path_info unless the base URL is stated explicitly
	print "<base href=\"".esc_url($base_url)."\" />\n"
		if ($ENV{'PATH_INFO'});
	print_header_links($status);

	print to_utf8($site_html_head_string)
		if (defined $site_html_head_string);

	print "</head>\n" .
	      "<body>\n";

	insert_file($site_header)
		if (defined $site_header && -f $site_header);

	print "<div class=\"page_header\">\n";
	if (defined $logo) {
		my $logo_img = $cgi->img({-src => esc_url($logo),
		                          -width => 72, -height => 27,
		                          -alt => "git",
		                          -class => "logo"});
		print $cgi->a({-href => esc_url($logo_url),
		               -title => $logo_label},
		              $logo_img);
	}
	print_nav_breadcrumbs(%opts);
	print "</div>\n";

	# the search form makes sense only within a project
	my $have_search = gitweb_check_feature('search');
	print_search_form()
		if (defined $project && $have_search);
}
4184
# Print the bottom of the HTML page and close the document.
#
# The output consists of, in order: the page footer (project
# description and feed links, or OPML/TXT links for the projects list),
# the timing information if the 'timed' feature is enabled, the
# optional site footer file, the JavaScript includes and the closing
# </body> and </html> tags.
sub git_footer_html {
	my $feed_class = 'rss_logo';

	print "<div class=\"page_footer\">\n";
	if (defined $project) {
		my $descr = git_get_project_description($project);
		print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
			if (defined $descr);

		my %href_params = get_feed_info();
		# no specific feed for this view: mark the links as generic
		$feed_class .= ' generic'
			unless (%href_params);
		$href_params{'-title'} ||= 'log';

		foreach my $format (qw(RSS Atom)) {
			$href_params{'action'} = lc($format);
			print $cgi->a({-href => href(%href_params),
			              -title => "$href_params{'-title'} $format feed",
			              -class => $feed_class}, $format)."\n";
		}

	} else {
		# projects list: link to its OPML and plain-text representations
		foreach my $link ([ "opml", "OPML", " " ],
		                  [ "project_index", "TXT", "\n" ]) {
			my ($feed_action, $label, $separator) = @$link;
			print $cgi->a({-href => href(project=>undef, action=>$feed_action,
			                             project_filter => $project_filter),
			              -class => $feed_class}, $label) . $separator;
		}
	}
	print "</div>\n"; # class="page_footer"

	if (defined $t0 && gitweb_check_feature('timed')) {
		print "<div id=\"generating_info\">\n";
		print 'This page took '.
		      '<span id="generating_time" class="time_span">'.
		      tv_interval($t0, [ gettimeofday() ]).
		      ' seconds </span>'.
		      ' and '.
		      '<span id="generating_cmd">'.
		      $number_of_git_cmds.
		      '</span> git commands '.
		      " to generate.\n";
		print "</div>\n"; # id="generating_info"
	}

	insert_file($site_footer)
		if (defined $site_footer && -f $site_footer);

	print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
	my $incremental_blame = (defined $action &&
	                         $action eq 'blame_incremental');
	if ($incremental_blame) {
		# incremental blame starts its own script instead of the
		# generic onload handler
		print qq!<script type="text/javascript">\n!.
		      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
		      qq! "!. href() .qq!");\n!.
		      qq!</script>\n!;
	} else {
		my ($jstimezone, $tz_cookie, $datetime_class) =
			gitweb_get_feature('javascript-timezone');

		print qq!<script type="text/javascript">\n!.
		      qq!window.onload = function () {\n!;
		print qq! fixLinks();\n!
			if (gitweb_check_feature('javascript-actions'));
		if ($jstimezone && $tz_cookie && $datetime_class) {
			print qq! var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!. # in days
			      qq! onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
		}
		print qq!};\n!.
		      qq!</script>\n!;
	}

	print "</body>\n</html>";
}
4263
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
#
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# Parameters:
#   status code   - defaults to 500 when false
#   error message - HTML-escaped before printing; defaults to
#                   "Internal Server Error" when empty
#   description   - optional, printed as is (it is expected to be HTML)
#   %opts         - remaining arguments, passed on to git_header_html();
#                   a true '-error_handler' makes the function return
#                   instead of jumping to DONE_GITWEB
#
# A status code outside the list above is sent to the client as
# "500 Internal Server Error"; the page body still shows the code that
# was passed in.
sub die_error {
	my $status = shift || 500;
	my $error = esc_html(shift) || "Internal Server Error";
	my $extra = shift;
	my %opts = @_;

	my %http_responses = (
		400 => '400 Bad Request',
		403 => '403 Forbidden',
		404 => '404 Not Found',
		500 => '500 Internal Server Error',
		503 => '503 Service Unavailable',
	);
	# git_header_html() turns an undefined status into "200 OK", so an
	# unlisted code must not be passed through as undef: an error page
	# must never be served as a success
	my $http_status = $http_responses{$status} || $http_responses{500};
	git_header_html($http_status, undef, %opts);
	print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
	if (defined $extra) {
		print "<hr />\n" .
		      "$extra\n";
	}
	print "</div>\n";

	git_footer_html();
	goto DONE_GITWEB
		unless ($opts{'-error_handler'});
}
4307
4308 ## ----------------------------------------------------------------------
4309 ## functions printing or outputting HTML: navigation
4310
4311 sub git_print_page_nav {
4312 my ($current, $suppress, $head, $treehead