Merge branch 'nd/untracked-cache'
[git.git] / gitweb / gitweb.perl
Commit [+]AuthorDateLineData
161332a5
KS
Kay Sievers2005-08-07 19:49:46 +02001#!/usr/bin/perl
2
c994d620 Kay Sievers2005-08-07 20:27:18 +02003# gitweb - simple web interface to track changes in git repositories
22fafb99 Kay Sievers2005-08-07 19:56:59 +02004#
00cd0794
KS
Kay Sievers2006-05-22 14:30:47 +02005# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6# (C) 2005, Christian Gierke
823d5dc8 Kay Sievers2005-08-07 19:57:58 +02007#
d8f1c5c2 Kay Sievers2005-10-04 01:12:47 +02008# This program is licensed under the GPLv2
161332a5 Kay Sievers2005-08-07 19:49:46 +02009
d48b2841 Ævar Arnfjörð Bjarmason2010-09-24 20:00:52 +000010use 5.008;
161332a5
KS
Kay Sievers2005-08-07 19:49:46 +020011use strict;
12use warnings;
19806691 Kay Sievers2005-08-07 20:26:27 +020013use CGI qw(:standard :escapeHTML -nosticky);
7403d50b Kay Sievers2005-08-07 20:23:49 +020014use CGI::Util qw(unescape);
7a597457 Jakub Narębski2010-04-24 16:00:04 +020015use CGI::Carp qw(fatalsToBrowser set_message);
40c13813 Kay Sievers2005-11-19 17:41:29 +010016use Encode;
b87d78d6 Kay Sievers2005-08-07 20:21:04 +020017use Fcntl ':mode';
7a13b999 Junio C Hamano2006-07-31 19:18:34 -070018use File::Find qw();
cb9c6e5b Aneesh Kumar K.V2006-08-17 20:59:46 +053019use File::Basename qw(basename);
3962f1d7 Jakub Narębski2010-11-09 19:27:54 +010020use Time::HiRes qw(gettimeofday tv_interval);
10bb9036 Kay Sievers2005-11-23 04:26:40 +010021binmode STDOUT, ':utf8';
161332a5 Kay Sievers2005-08-07 19:49:46 +020022
13dbf46a
JK
Jeff King2014-11-18 12:10:22 -050023if (!defined($CGI::VERSION) || $CGI::VERSION < 4.08) {
24 eval 'sub CGI::multi_param { CGI::param(@_) }'
25}
26
3962f1d7 Jakub Narębski2010-11-09 19:27:54 +010027our $t0 = [ gettimeofday() ];
aa7dd05e
JN
Jakub Narębski2009-09-01 13:39:16 +020028our $number_of_git_cmds = 0;
29
b1f5f64f Jakub Narębski2006-12-28 00:00:52 +010030BEGIN {
3be8e720 Jakub Narębski2007-04-01 22:22:21 +020031 CGI->compile() if $ENV{'MOD_PERL'};
b1f5f64f
JN
Jakub Narębski2006-12-28 00:00:52 +010032}
33
06c084d2 Junio C Hamano2006-08-02 13:50:20 -070034our $version = "++GIT_VERSION++";
3e029299 Kay Sievers2005-08-07 20:05:15 +020035
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +020036our ($my_url, $my_uri, $base_url, $path_info, $home_link);
37sub evaluate_uri {
38 our $cgi;
81d3fe9f Giuseppe Bilotta2009-02-15 10:18:36 +010039
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +020040 our $my_url = $cgi->url();
41 our $my_uri = $cgi->url(-absolute => 1);
42
43 # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
44 # needed and used only for URLs with nonempty PATH_INFO
45 our $base_url = $my_url;
46
47 # When the script is used as DirectoryIndex, the URL does not contain the name
48 # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
49 # have to do it ourselves. We make $path_info global because it's also used
50 # later on.
51 #
52 # Another issue with the script being the DirectoryIndex is that the resulting
53 # $my_url data is not the full script URL: this is good, because we want
54 # generated links to keep implying the script name if it wasn't explicitly
55 # indicated in the URL we're handling, but it means that $my_url cannot be used
56 # as base URL.
57 # Therefore, if we needed to strip PATH_INFO, then we know that we have
58 # to build the base URL ourselves:
84d9e2d5 Jakub Narębski2012-02-03 13:44:54 +010059 our $path_info = decode_utf8($ENV{"PATH_INFO"});
c2394fe9 Jakub Narębski2010-05-07 14:54:04 +020060 if ($path_info) {
cacfc09b
JS
Jay Soffian2012-08-08 22:29:26 -040061 # $path_info has already been URL-decoded by the web server, but
62 # $my_url and $my_uri have not. URL-decode them so we can properly
63 # strip $path_info.
64 $my_url = unescape($my_url);
65 $my_uri = unescape($my_uri);
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +020066 if ($my_url =~ s,\Q$path_info\E$,, &&
67 $my_uri =~ s,\Q$path_info\E$,, &&
68 defined $ENV{'SCRIPT_NAME'}) {
69 $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
70 }
81d3fe9f Giuseppe Bilotta2009-02-15 10:18:36 +010071 }
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +020072
73 # target of the home link on top of all pages
74 our $home_link = $my_uri || "/";
b65910fe
GB
Giuseppe Bilotta2008-09-29 15:07:42 +020075}
76
e130ddaa
AT
Alp Toker2006-07-12 23:55:10 +010077# core git executable to use
78# this can just be "git" if your webserver has a sensible PATH
06c084d2 Junio C Hamano2006-08-02 13:50:20 -070079our $GIT = "++GIT_BINDIR++/git";
3f7f2710 Jakub Narębski2006-06-21 09:48:04 +020080
b87d78d6 Kay Sievers2005-08-07 20:21:04 +020081# absolute fs-path which will be prepended to the project path
4a87b43e Dennis Stosberg2006-06-21 15:07:08 +020082#our $projectroot = "/pub/scm";
06c084d2 Junio C Hamano2006-08-02 13:50:20 -070083our $projectroot = "++GITWEB_PROJECTROOT++";
b87d78d6 Kay Sievers2005-08-07 20:21:04 +020084
ca5e9495
LL
Luke Lu2007-10-16 20:45:25 -070085# fs traversing limit for getting project list
86# the number is relative to the projectroot
87our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
88
2de21fac
YS
Yasushi SHOJI2006-08-15 07:50:49 +090089# string of the home link on top of all pages
90our $home_link_str = "++GITWEB_HOME_LINK_STR++";
91
ad9c2e22
TF
Tony Finch2013-07-04 18:02:12 +010092# extra breadcrumbs preceding the home link
93our @extra_breadcrumbs = ();
94
49da1daf
AT
Alp Toker2006-07-11 21:10:26 +010095# name of your site or organization to appear in page titles
96# replace this with something more descriptive for clearer bookmarks
8be2890c
PB
Petr Baudis2006-10-24 05:18:39 +020097our $site_name = "++GITWEB_SITENAME++"
98 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
49da1daf Alp Toker2006-07-11 21:10:26 +010099
c1355b7f
LH
Lénaïc Huard2011-10-21 09:09:29 +0200100# html snippet to include in the <head> section of each page
101our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
b2d3476e
AC
Alan Chandler2006-10-03 13:49:03 +0100102# filename of html text to include at top of each page
103our $site_header = "++GITWEB_SITE_HEADER++";
8ab1da2c Kay Sievers2005-08-07 20:22:53 +0200104# html text to include at home page
06c084d2 Junio C Hamano2006-08-02 13:50:20 -0700105our $home_text = "++GITWEB_HOMETEXT++";
b2d3476e
AC
Alan Chandler2006-10-03 13:49:03 +0100106# filename of html text to include at bottom of each page
107our $site_footer = "++GITWEB_SITE_FOOTER++";
108
109# URI of stylesheets
110our @stylesheets = ("++GITWEB_CSS++");
887a612f
PB
Petr Baudis2006-10-26 14:41:25 +0200111# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
112our $stylesheet = undef;
9a7a62ff Jakub Narębski2006-10-06 12:31:05 +0200113# URI of GIT logo (72x27 size)
06c084d2 Junio C Hamano2006-08-02 13:50:20 -0700114our $logo = "++GITWEB_LOGO++";
0b5deba1
JN
Jakub Narębski2006-09-04 20:32:13 +0200115# URI of GIT favicon, assumed to be image/png type
116our $favicon = "++GITWEB_FAVICON++";
4af819d4
JN
Jakub Narębski2009-09-01 13:39:17 +0200117# URI of gitweb.js (JavaScript code for gitweb)
118our $javascript = "++GITWEB_JS++";
aedd9425 Jakub Narębski2006-06-17 11:23:56 +0200119
9a7a62ff
JN
Jakub Narębski2006-10-06 12:31:05 +0200120# URI and label (title) of GIT logo link
121#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
122#our $logo_label = "git documentation";
69fb8283 Wincent Colaiuta2009-07-12 14:31:28 +0200123our $logo_url = "http://git-scm.com/";
9a7a62ff Jakub Narębski2006-10-06 12:31:05 +0200124our $logo_label = "git homepage";
51a7c66a Junio C Hamano2006-09-23 12:36:01 -0700125
09bd7898 Kay Sievers2005-08-07 20:21:23 +0200126# source of projects list
06c084d2 Junio C Hamano2006-08-02 13:50:20 -0700127our $projects_list = "++GITWEB_LIST++";
b87d78d6 Kay Sievers2005-08-07 20:21:04 +0200128
55feb120
MH
Michael Hendricks2007-07-04 18:36:48 -0600129# the width (in characters) of the projects list "Description" column
130our $projects_list_description_width = 25;
131
d940c901
SC
Sebastien Cevey2011-04-29 19:52:01 +0200132# group projects by category on the projects list
133# (enabled if this variable evaluates to true)
134our $projects_list_group_categories = 0;
135
136# default category if none specified
137# (leave the empty string for no category)
138our $project_list_default_category = "";
139
b06dcf8c
FL
Frank Lichtenheld2007-04-06 23:58:24 +0200140# default order of projects list
141# valid values are none, project, descr, owner, and age
142our $default_projects_order = "project";
143
32f4aacc
ML
Matthias Lederhofer2006-09-17 00:31:01 +0200144# show repository only if this file exists
145# (only effective if this variable evaluates to true)
146our $export_ok = "++GITWEB_EXPORT_OK++";
147
5710be46
KK
Kacper Kornet2012-04-24 19:39:15 +0200148# don't generate age column on the projects list page
149our $omit_age_column = 0;
150
0ebe7827
KK
Kacper Kornet2012-04-26 18:45:44 +0200151# don't generate information about owners of repositories
152our $omit_owner=0;
153
dd7f5f10
AG
Alexander Gavrilov2008-11-06 01:36:23 +0300154# show repository only if this subroutine returns true
155# when given the path to the project, for example:
156# sub { return -e "$_[0]/git-daemon-export-ok"; }
157our $export_auth_hook = undef;
158
32f4aacc
ML
Matthias Lederhofer2006-09-17 00:31:01 +0200159# only allow viewing of repositories also shown on the overview page
160our $strict_export = "++GITWEB_STRICT_EXPORT++";
161
19a8721e
JN
Jakub Narębski2006-08-15 23:03:17 +0200162# list of git base URLs used for URL to where fetch project from,
163# i.e. full URL is "$git_base_url/$project"
d6b7e0b9 Jakub Narębski2006-10-26 12:26:44 +0200164our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
19a8721e Jakub Narębski2006-08-15 23:03:17 +0200165
f5aa79d9 Jakub Narębski2006-06-17 13:32:15 +0200166# default blob_plain mimetype and default charset for text/plain blob
4a87b43e
DS
Dennis Stosberg2006-06-21 15:07:08 +0200167our $default_blob_plain_mimetype = 'text/plain';
168our $default_text_plain_charset = undef;
f5aa79d9 Jakub Narębski2006-06-17 13:32:15 +0200169
2d007374
PB
Petr Baudis2006-06-18 00:01:06 +0200170# file to use for guessing MIME types before trying /etc/mime.types
171# (relative to the current git repository)
4a87b43e Dennis Stosberg2006-06-21 15:07:08 +0200172our $mimetypes_file = undef;
2d007374 Petr Baudis2006-06-18 00:01:06 +0200173
00f429af
MK
Martin Koegler2007-06-03 17:42:44 +0200174# assume this charset if line contains non-UTF-8 characters;
175# it should be valid encoding (see Encoding::Supported(3pm) for list),
176# for which encoding all byte sequences are valid, for example
177# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
178# could be even 'utf-8' for the old behavior)
179our $fallback_encoding = 'latin1';
180
69a9b41c
JN
Jakub Narębski2007-07-20 02:15:09 +0200181# rename detection options for git-diff and git-diff-tree
182# - default is '-M', with the cost proportional to
183# (number of removed files) * (number of new files).
184# - more costly is '-C' (which implies '-M'), with the cost proportional to
185# (number of changed files + number of removed files) * (number of new files)
186# - even more costly is '-C', '--find-copies-harder' with cost
187# (number of files in the original tree) * (number of new files)
188# - one might want to include '-B' option, e.g. '-B', '-M'
189our @diff_opts = ('-M'); # taken from git_commit
190
7e1100e9
MM
Matt McCutchen2009-02-07 19:00:09 -0500191# Disables features that would allow repository owners to inject script into
192# the gitweb domain.
193our $prevent_xss = 0;
194
7ce896b3
CW
Christopher Wilson2010-09-21 00:25:19 -0700195# Path to the highlight executable to use (must be the one from
196# http://www.andre-simon.de due to assumptions about parameters and output).
197# Useful if highlight is not installed on your webserver's PATH.
198# [Default: highlight]
199our $highlight_bin = "++HIGHLIGHT_BIN++";
200
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +0200201# information about snapshot formats that gitweb is capable of serving
202our %known_snapshot_formats = (
203 # name => {
204 # 'display' => display name,
205 # 'type' => mime type,
206 # 'suffix' => filename suffix,
207 # 'format' => --format for git-archive,
208 # 'compressor' => [compressor command and arguments]
1bfd3631
MR
Mark Rada2009-08-06 10:25:39 -0400209 # (array reference, optional)
210 # 'disabled' => boolean (optional)}
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +0200211 #
212 'tgz' => {
213 'display' => 'tar.gz',
214 'type' => 'application/x-gzip',
215 'suffix' => '.tar.gz',
216 'format' => 'tar',
0c8c385e Fraser Tweedale2011-04-26 11:32:00 +1000217 'compressor' => ['gzip', '-n']},
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +0200218
219 'tbz2' => {
220 'display' => 'tar.bz2',
221 'type' => 'application/x-bzip2',
222 'suffix' => '.tar.bz2',
223 'format' => 'tar',
224 'compressor' => ['bzip2']},
225
cbdefb5a
MR
Mark Rada2009-08-06 10:28:25 -0400226 'txz' => {
227 'display' => 'tar.xz',
228 'type' => 'application/x-xz',
229 'suffix' => '.tar.xz',
230 'format' => 'tar',
231 'compressor' => ['xz'],
232 'disabled' => 1},
233
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +0200234 'zip' => {
235 'display' => 'zip',
236 'type' => 'application/x-zip',
237 'suffix' => '.zip',
238 'format' => 'zip'},
239);
240
241# Aliases so we understand old gitweb.snapshot values in repository
242# configuration.
243our %known_snapshot_format_aliases = (
244 'gzip' => 'tgz',
245 'bzip2' => 'tbz2',
cbdefb5a Mark Rada2009-08-06 10:28:25 -0400246 'xz' => 'txz',
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +0200247
248 # backward compatibility: legacy gitweb config support
249 'x-gzip' => undef, 'gz' => undef,
250 'x-bzip2' => undef, 'bz2' => undef,
251 'x-zip' => undef, '' => undef,
252);
253
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +0200254# Pixel sizes for icons and avatars. If the default font sizes or lineheights
255# are changed, it may be appropriate to change these values too via
256# $GITWEB_CONFIG.
257our %avatar_size = (
258 'default' => 16,
259 'double' => 32
260);
261
b62a1a98
JWH
John 'Warthog9' Hawley2010-01-30 23:30:39 +0100262# Used to set the maximum load that we will still respond to gitweb queries.
263# If server load exceed this value then return "503 server busy" error.
264# If gitweb cannot determined server load, it is taken to be 0.
265# Leave it undefined (or set to 'undef') to turn off load checking.
266our $maxload = 300;
267
61bf126e
AS
Alejandro R. Sedeño2010-07-28 14:40:53 -0400268# configuration for 'highlight' (http://www.andre-simon.de/)
269# match by basename
270our %highlight_basename = (
271 #'Program' => 'py',
272 #'Library' => 'py',
273 'SConstruct' => 'py', # SCons equivalent of Makefile
274 'Makefile' => 'make',
275);
276# match by extension
277our %highlight_ext = (
278 # main extensions, defining name of syntax;
279 # see files in /usr/share/highlight/langDefs/ directory
048b3991 Richard Hubbell2012-11-04 09:45:55 -0800280 (map { $_ => $_ } qw(py rb java css js tex bib xml awk bat ini spec tcl sql)),
61bf126e Alejandro R. Sedeño2010-07-28 14:40:53 -0400281 # alternate extensions, see /etc/highlight/filetypes.conf
048b3991
RH
Richard Hubbell2012-11-04 09:45:55 -0800282 (map { $_ => 'c' } qw(c h)),
283 (map { $_ => 'sh' } qw(sh bash zsh ksh)),
284 (map { $_ => 'cpp' } qw(cpp cxx c++ cc)),
285 (map { $_ => 'php' } qw(php php3 php4 php5 phps)),
286 (map { $_ => 'pl' } qw(pl perl pm)), # perhaps also 'cgi'
287 (map { $_ => 'make'} qw(make mak mk)),
288 (map { $_ => 'xml' } qw(xml xhtml html htm)),
61bf126e
AS
Alejandro R. Sedeño2010-07-28 14:40:53 -0400289);
290
ddb8d900
AK
Aneesh Kumar K.V2006-08-20 11:53:04 +0530291# You define site-wide feature defaults here; override them with
292# $GITWEB_CONFIG as necessary.
952c65fc Jakub Narębski2006-08-22 16:52:50 +0200293our %feature = (
17848fc6
JN
Jakub Narębski2006-08-26 19:14:22 +0200294 # feature => {
295 # 'sub' => feature-sub (subroutine),
296 # 'override' => allow-override (boolean),
297 # 'default' => [ default options...] (array reference)}
298 #
b4b20b21 Jakub Narębski2007-05-15 01:55:44 +0200299 # if feature is overridable (it means that allow-override has true value),
17848fc6
JN
Jakub Narębski2006-08-26 19:14:22 +0200300 # then feature-sub will be called with default options as parameters;
301 # return value of feature-sub indicates if to enable specified feature
302 #
b4b20b21 Jakub Narębski2007-05-15 01:55:44 +0200303 # if there is no 'sub' key (no feature-sub), then feature cannot be
22e5e58a Ralf Wildenhues2010-08-22 13:12:12 +0200304 # overridden
b4b20b21 Jakub Narębski2007-05-15 01:55:44 +0200305 #
ff3c0ff2
GB
Giuseppe Bilotta2008-12-02 14:57:28 -0800306 # use gitweb_get_feature(<feature>) to retrieve the <feature> value
307 # (an array) or gitweb_check_feature(<feature>) to check if <feature>
308 # is enabled
952c65fc Jakub Narębski2006-08-22 16:52:50 +0200309
45a3b12c
PB
Petr Baudis2006-10-07 15:17:47 +0200310 # Enable the 'blame' blob view, showing the last commit that modified
311 # each line in the file. This can be very CPU-intensive.
312
313 # To enable system wide have in $GITWEB_CONFIG
314 # $feature{'blame'}{'default'} = [1];
315 # To have project specific config enable override in $GITWEB_CONFIG
316 # $feature{'blame'}{'override'} = 1;
317 # and in project config gitweb.blame = 0|1;
952c65fc Jakub Narębski2006-08-22 16:52:50 +0200318 'blame' => {
cdad8170 Matt Kraai2008-12-15 22:16:19 -0800319 'sub' => sub { feature_bool('blame', @_) },
952c65fc
JN
Jakub Narębski2006-08-22 16:52:50 +0200320 'override' => 0,
321 'default' => [0]},
322
a3c8ab30 Matt McCutchen2007-07-22 01:30:27 +0200323 # Enable the 'snapshot' link, providing a compressed archive of any
45a3b12c
PB
Petr Baudis2006-10-07 15:17:47 +0200324 # tree. This can potentially generate high traffic if you have large
325 # project.
326
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +0200327 # Value is a list of formats defined in %known_snapshot_formats that
328 # you wish to offer.
45a3b12c Petr Baudis2006-10-07 15:17:47 +0200329 # To disable system wide have in $GITWEB_CONFIG
a3c8ab30 Matt McCutchen2007-07-22 01:30:27 +0200330 # $feature{'snapshot'}{'default'} = [];
45a3b12c Petr Baudis2006-10-07 15:17:47 +0200331 # To have project specific config enable override in $GITWEB_CONFIG
bbee1d97 Uwe Kleine-König2006-12-08 12:44:31 +0100332 # $feature{'snapshot'}{'override'} = 1;
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +0200333 # and in project config, a comma-separated list of formats or "none"
334 # to disable. Example: gitweb.snapshot = tbz2,zip;
952c65fc
JN
Jakub Narębski2006-08-22 16:52:50 +0200335 'snapshot' => {
336 'sub' => \&feature_snapshot,
337 'override' => 0,
a3c8ab30 Matt McCutchen2007-07-22 01:30:27 +0200338 'default' => ['tgz']},
04f7a94f Jakub Narębski2006-09-11 00:29:27 +0200339
6be93511
RF
Robert Fitzsimons2006-12-23 03:35:16 +0000340 # Enable text search, which will list the commits which match author,
341 # committer or commit text to a given string. Enabled by default.
b4b20b21 Jakub Narębski2007-05-15 01:55:44 +0200342 # Project specific override is not supported.
e0ca3645
JN
Jakub Narębski2011-06-22 17:28:52 +0200343 #
344 # Note that this controls all search features, which means that if
345 # it is disabled, then 'grep' and 'pickaxe' search would also be
346 # disabled.
6be93511
RF
Robert Fitzsimons2006-12-23 03:35:16 +0000347 'search' => {
348 'override' => 0,
349 'default' => [1]},
350
e7738553
PB
Petr Baudis2007-05-17 04:31:12 +0200351 # Enable grep search, which will list the files in currently selected
352 # tree containing the given string. Enabled by default. This can be
353 # potentially CPU-intensive, of course.
a598ded1 Jakub Narębski2011-06-21 08:41:16 +0200354 # Note that you need to have 'search' feature enabled too.
e7738553
PB
Petr Baudis2007-05-17 04:31:12 +0200355
356 # To enable system wide have in $GITWEB_CONFIG
357 # $feature{'grep'}{'default'} = [1];
358 # To have project specific config enable override in $GITWEB_CONFIG
359 # $feature{'grep'}{'override'} = 1;
360 # and in project config gitweb.grep = 0|1;
361 'grep' => {
cdad8170 Matt Kraai2008-12-15 22:16:19 -0800362 'sub' => sub { feature_bool('grep', @_) },
e7738553
PB
Petr Baudis2007-05-17 04:31:12 +0200363 'override' => 0,
364 'default' => [1]},
365
45a3b12c
PB
Petr Baudis2006-10-07 15:17:47 +0200366 # Enable the pickaxe search, which will list the commits that modified
367 # a given string in a file. This can be practical and quite faster
368 # alternative to 'blame', but still potentially CPU-intensive.
a598ded1 Jakub Narębski2011-06-21 08:41:16 +0200369 # Note that you need to have 'search' feature enabled too.
45a3b12c
PB
Petr Baudis2006-10-07 15:17:47 +0200370
371 # To enable system wide have in $GITWEB_CONFIG
372 # $feature{'pickaxe'}{'default'} = [1];
373 # To have project specific config enable override in $GITWEB_CONFIG
374 # $feature{'pickaxe'}{'override'} = 1;
375 # and in project config gitweb.pickaxe = 0|1;
04f7a94f Jakub Narębski2006-09-11 00:29:27 +0200376 'pickaxe' => {
cdad8170 Matt Kraai2008-12-15 22:16:19 -0800377 'sub' => sub { feature_bool('pickaxe', @_) },
04f7a94f
JN
Jakub Narębski2006-09-11 00:29:27 +0200378 'override' => 0,
379 'default' => [1]},
9e756904 Martin Waitz2006-10-01 23:57:48 +0200380
e4b48eaa
JN
Jakub Narębski2009-09-07 14:40:00 +0200381 # Enable showing size of blobs in a 'tree' view, in a separate
382 # column, similar to what 'ls -l' does. This cost a bit of IO.
383
384 # To disable system wide have in $GITWEB_CONFIG
385 # $feature{'show-sizes'}{'default'} = [0];
386 # To have project specific config enable override in $GITWEB_CONFIG
387 # $feature{'show-sizes'}{'override'} = 1;
388 # and in project config gitweb.showsizes = 0|1;
389 'show-sizes' => {
390 'sub' => sub { feature_bool('showsizes', @_) },
391 'override' => 0,
392 'default' => [1]},
393
45a3b12c
PB
Petr Baudis2006-10-07 15:17:47 +0200394 # Make gitweb use an alternative format of the URLs which can be
395 # more readable and natural-looking: project name is embedded
396 # directly in the path and the query string contains other
397 # auxiliary information. All gitweb installations recognize
398 # URL in either format; this configures in which formats gitweb
399 # generates links.
400
401 # To enable system wide have in $GITWEB_CONFIG
402 # $feature{'pathinfo'}{'default'} = [1];
403 # Project specific override is not supported.
404
405 # Note that you will need to change the default location of CSS,
406 # favicon, logo and possibly other files to an absolute URL. Also,
407 # if gitweb.cgi serves as your indexfile, you will need to force
408 # $my_uri to contain the script name in your $GITWEB_CONFIG.
9e756904
MW
Martin Waitz2006-10-01 23:57:48 +0200409 'pathinfo' => {
410 'override' => 0,
411 'default' => [0]},
e30496df
PB
Petr Baudis2006-10-24 05:33:17 +0200412
413 # Make gitweb consider projects in project root subdirectories
414 # to be forks of existing projects. Given project $projname.git,
415 # projects matching $projname/*.git will not be shown in the main
416 # projects list, instead a '+' mark will be added to $projname
417 # there and a 'forks' view will be enabled for the project, listing
c2b8b134
FL
Frank Lichtenheld2007-04-06 23:58:11 +0200418 # all the forks. If project list is taken from a file, forks have
419 # to be listed after the main project.
e30496df
PB
Petr Baudis2006-10-24 05:33:17 +0200420
421 # To enable system wide have in $GITWEB_CONFIG
422 # $feature{'forks'}{'default'} = [1];
423 # Project specific override is not supported.
424 'forks' => {
425 'override' => 0,
426 'default' => [0]},
d627f68f
PB
Petr Baudis2008-10-02 16:36:52 +0200427
428 # Insert custom links to the action bar of all project pages.
429 # This enables you mainly to link to third-party scripts integrating
430 # into gitweb; e.g. git-browser for graphical history representation
431 # or custom web-based repository administration interface.
432
433 # The 'default' value consists of a list of triplets in the form
434 # (label, link, position) where position is the label after which
2b11e059 Jakub Narębski2008-10-12 00:02:32 +0200435 # to insert the link and link is a format string where %n expands
d627f68f
PB
Petr Baudis2008-10-02 16:36:52 +0200436 # to the project name, %f to the project path within the filesystem,
437 # %h to the current hash (h gitweb parameter) and %b to the current
2b11e059 Jakub Narębski2008-10-12 00:02:32 +0200438 # hash base (hb gitweb parameter); %% expands to %.
d627f68f
PB
Petr Baudis2008-10-02 16:36:52 +0200439
440 # To enable system wide have in $GITWEB_CONFIG e.g.
441 # $feature{'actions'}{'default'} = [('graphiclog',
442 # '/git-browser/by-commit.html?r=%n', 'summary')];
443 # Project specific override is not supported.
444 'actions' => {
445 'override' => 0,
446 'default' => []},
3e3d4ee7 Shawn O. Pearce2008-10-03 07:41:25 -0700447
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +0200448 # Allow gitweb scan project content tags of project repository,
449 # and display the popular Web 2.0-ish "tag cloud" near the projects
450 # list. Note that this is something COMPLETELY different from the
451 # normal Git tags.
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +0200452
453 # gitweb by itself can show existing tags, but it does not handle
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +0200454 # tagging itself; you need to do it externally, outside gitweb.
455 # The format is described in git_get_project_ctags() subroutine.
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +0200456 # You may want to install the HTML::TagCloud Perl module to get
457 # a pretty tag cloud instead of just a list of tags.
458
459 # To enable system wide have in $GITWEB_CONFIG
0368c492 Jakub Narębski2011-04-29 19:51:57 +0200460 # $feature{'ctags'}{'default'} = [1];
aed93de4 Petr Baudis2008-10-02 17:13:02 +0200461 # Project specific override is not supported.
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +0200462
463 # In the future whether ctags editing is enabled might depend
464 # on the value, but using 1 should always mean no editing of ctags.
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +0200465 'ctags' => {
466 'override' => 0,
467 'default' => [0]},
9872cd6f
GB
Giuseppe Bilotta2008-12-18 08:13:16 +0100468
469 # The maximum number of patches in a patchset generated in patch
470 # view. Set this to 0 or undef to disable patch view, or to a
471 # negative number to remove any limit.
472
473 # To disable system wide have in $GITWEB_CONFIG
474 # $feature{'patches'}{'default'} = [0];
475 # To have project specific config enable override in $GITWEB_CONFIG
476 # $feature{'patches'}{'override'} = 1;
477 # and in project config gitweb.patches = 0|n;
478 # where n is the maximum number of patches allowed in a patchset.
479 'patches' => {
480 'sub' => \&feature_patches,
481 'override' => 0,
482 'default' => [16]},
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +0200483
484 # Avatar support. When this feature is enabled, views such as
485 # shortlog or commit will display an avatar associated with
486 # the email of the committer(s) and/or author(s).
487
679a1a1d
GB
Giuseppe Bilotta2009-06-30 00:00:53 +0200488 # Currently available providers are gravatar and picon.
489 # If an unknown provider is specified, the feature is disabled.
490
491 # Gravatar depends on Digest::MD5.
492 # Picon currently relies on the indiana.edu database.
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +0200493
494 # To enable system wide have in $GITWEB_CONFIG
679a1a1d
GB
Giuseppe Bilotta2009-06-30 00:00:53 +0200495 # $feature{'avatar'}{'default'} = ['<provider>'];
496 # where <provider> is either gravatar or picon.
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +0200497 # To have project specific config enable override in $GITWEB_CONFIG
498 # $feature{'avatar'}{'override'} = 1;
679a1a1d Giuseppe Bilotta2009-06-30 00:00:53 +0200499 # and in project config gitweb.avatar = <provider>;
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +0200500 'avatar' => {
501 'sub' => \&feature_avatar,
502 'override' => 0,
503 'default' => ['']},
aa7dd05e
JN
Jakub Narębski2009-09-01 13:39:16 +0200504
505 # Enable displaying how much time and how many git commands
506 # it took to generate and display page. Disabled by default.
507 # Project specific override is not supported.
508 'timed' => {
509 'override' => 0,
510 'default' => [0]},
e627e50a
JN
Jakub Narębski2009-11-26 21:12:15 +0100511
512 # Enable turning some links into links to actions which require
513 # JavaScript to run (like 'blame_incremental'). Not enabled by
514 # default. Project specific override is currently not supported.
515 'javascript-actions' => {
516 'override' => 0,
517 'default' => [0]},
b331fe54 Johannes Schindelin2010-04-27 21:34:44 +0200518
2e987f92
JN
Jakub Narębski2011-04-28 21:04:11 +0200519 # Enable and configure ability to change common timezone for dates
520 # in gitweb output via JavaScript. Enabled by default.
521 # Project specific override is not supported.
522 'javascript-timezone' => {
523 'override' => 0,
524 'default' => [
525 'local', # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
526 # or undef to turn off this feature
527 'gitweb_tz', # name of cookie where to store selected timezone
528 'datetime', # CSS class used to mark up dates for manipulation
529 ]},
530
b331fe54
JS
Johannes Schindelin2010-04-27 21:34:44 +0200531 # Syntax highlighting support. This is based on Daniel Svensson's
532 # and Sham Chukoury's work in gitweb-xmms2.git.
592ea417
JN
Jakub Narębski2010-04-27 21:34:45 +0200533 # It requires the 'highlight' program present in $PATH,
534 # and therefore is disabled by default.
b331fe54
JS
Johannes Schindelin2010-04-27 21:34:44 +0200535
536 # To enable system wide have in $GITWEB_CONFIG
537 # $feature{'highlight'}{'default'} = [1];
538
539 'highlight' => {
540 'sub' => sub { feature_bool('highlight', @_) },
541 'override' => 0,
542 'default' => [0]},
60efa245
GB
Giuseppe Bilotta2010-11-11 13:26:09 +0100543
544 # Enable displaying of remote heads in the heads list
545
546 # To enable system wide have in $GITWEB_CONFIG
547 # $feature{'remote_heads'}{'default'} = [1];
548 # To have project specific config enable override in $GITWEB_CONFIG
549 # $feature{'remote_heads'}{'override'} = 1;
af507944 Phil Pennock2012-11-05 18:50:47 -0500550 # and in project config gitweb.remoteheads = 0|1;
60efa245
GB
Giuseppe Bilotta2010-11-11 13:26:09 +0100551 'remote_heads' => {
552 'sub' => sub { feature_bool('remote_heads', @_) },
553 'override' => 0,
554 'default' => [0]},
8d646a9b
KN
Krzesimir Nowak2013-12-11 12:54:43 +0100555
556 # Enable showing branches under other refs in addition to heads
557
558 # To set system wide extra branch refs have in $GITWEB_CONFIG
559 # $feature{'extra-branch-refs'}{'default'} = ['dirs', 'of', 'choice'];
560 # To have project specific config enable override in $GITWEB_CONFIG
561 # $feature{'extra-branch-refs'}{'override'} = 1;
562 # and in project config gitweb.extrabranchrefs = dirs of choice
563 # Every directory is separated with whitespace.
564
565 'extra-branch-refs' => {
566 'sub' => \&feature_extra_branch_refs,
567 'override' => 0,
568 'default' => []},
ddb8d900
AK
Aneesh Kumar K.V2006-08-20 11:53:04 +0530569);
570
a7c5a283 Junio C Hamano2008-11-29 13:02:08 -0800571sub gitweb_get_feature {
ddb8d900 Aneesh Kumar K.V2006-08-20 11:53:04 +0530572 my ($name) = @_;
dd1ad5f1 Jakub Narębski2006-09-26 01:56:17 +0200573 return unless exists $feature{$name};
952c65fc
JN
Jakub Narębski2006-08-22 16:52:50 +0200574 my ($sub, $override, @defaults) = (
575 $feature{$name}{'sub'},
576 $feature{$name}{'override'},
577 @{$feature{$name}{'default'}});
9be3614e
JN
Jakub Narębski2010-03-01 22:51:34 +0100578 # project specific override is possible only if we have project
579 our $git_dir; # global variable, declared later
580 if (!$override || !defined $git_dir) {
581 return @defaults;
582 }
a9455919 Martin Waitz2006-10-03 20:07:43 +0200583 if (!defined $sub) {
93197898 Nanako Shiraishi2009-08-28 12:18:49 +0900584 warn "feature $name is not overridable";
a9455919
MW
Martin Waitz2006-10-03 20:07:43 +0200585 return @defaults;
586 }
ddb8d900
AK
Aneesh Kumar K.V2006-08-20 11:53:04 +0530587 return $sub->(@defaults);
588}
589
25b2790f
GB
Giuseppe Bilotta2008-11-29 13:07:29 -0800590# A wrapper to check if a given feature is enabled.
591# With this, you can say
592#
593# my $bool_feat = gitweb_check_feature('bool_feat');
594# gitweb_check_feature('bool_feat') or somecode;
595#
596# instead of
597#
598# my ($bool_feat) = gitweb_get_feature('bool_feat');
599# (gitweb_get_feature('bool_feat'))[0] or somecode;
600#
601sub gitweb_check_feature {
602 return (gitweb_get_feature(@_))[0];
603}
604
605
cdad8170
MK
Matt Kraai2008-12-15 22:16:19 -0800606sub feature_bool {
607 my $key = shift;
608 my ($val) = git_get_project_config($key, '--bool');
ddb8d900 Aneesh Kumar K.V2006-08-20 11:53:04 +0530609
df5d10a3
MC
Marcel M. Cary2009-02-18 14:09:41 +0100610 if (!defined $val) {
611 return ($_[0]);
612 } elsif ($val eq 'true') {
cdad8170 Matt Kraai2008-12-15 22:16:19 -0800613 return (1);
ddb8d900 Aneesh Kumar K.V2006-08-20 11:53:04 +0530614 } elsif ($val eq 'false') {
cdad8170 Matt Kraai2008-12-15 22:16:19 -0800615 return (0);
ddb8d900 Aneesh Kumar K.V2006-08-20 11:53:04 +0530616 }
ddb8d900
AK
Aneesh Kumar K.V2006-08-20 11:53:04 +0530617}
618
ddb8d900 Aneesh Kumar K.V2006-08-20 11:53:04 +0530619sub feature_snapshot {
a3c8ab30 Matt McCutchen2007-07-22 01:30:27 +0200620 my (@fmts) = @_;
ddb8d900
AK
Aneesh Kumar K.V2006-08-20 11:53:04 +0530621
622 my ($val) = git_get_project_config('snapshot');
623
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +0200624 if ($val) {
625 @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
ddb8d900
AK
Aneesh Kumar K.V2006-08-20 11:53:04 +0530626 }
627
a3c8ab30 Matt McCutchen2007-07-22 01:30:27 +0200628 return @fmts;
de9272f4
LT
Luben Tuikov2006-09-28 16:49:21 -0700629}
630
9872cd6f
GB
Giuseppe Bilotta2008-12-18 08:13:16 +0100631sub feature_patches {
632 my @val = (git_get_project_config('patches', '--int'));
633
634 if (@val) {
635 return @val;
636 }
637
638 return ($_[0]);
639}
640
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +0200641sub feature_avatar {
642 my @val = (git_get_project_config('avatar'));
643
644 return @val ? @val : @_;
645}
646
8d646a9b
KN
Krzesimir Nowak2013-12-11 12:54:43 +0100647sub feature_extra_branch_refs {
648 my (@branch_refs) = @_;
649 my $values = git_get_project_config('extrabranchrefs');
650
651 if ($values) {
652 $values = config_to_multi ($values);
653 @branch_refs = ();
654 foreach my $value (@{$values}) {
655 push @branch_refs, split /\s+/, $value;
656 }
657 }
658
659 return @branch_refs;
660}
661
2172ce4b
JH
Junio C Hamano2006-10-03 02:30:47 -0700662# checking HEAD file with -e is fragile if the repository was
663# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
664# and then pruned.
665sub check_head_link {
666 my ($dir) = @_;
667 my $headfile = "$dir/HEAD";
668 return ((-e $headfile) ||
669 (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
670}
671
672sub check_export_ok {
673 my ($dir) = @_;
674 return (check_head_link($dir) &&
dd7f5f10
AG
Alexander Gavrilov2008-11-06 01:36:23 +0300675 (!$export_ok || -e "$dir/$export_ok") &&
676 (!$export_auth_hook || $export_auth_hook->($dir)));
2172ce4b
JH
Junio C Hamano2006-10-03 02:30:47 -0700677}
678
a781785d
JN
Jakub Narębski2007-07-22 23:41:20 +0200679# process alternate names for backward compatibility
680# filter out unsupported (unknown) snapshot formats
681sub filter_snapshot_fmts {
682 my @fmts = @_;
683
684 @fmts = map {
685 exists $known_snapshot_format_aliases{$_} ?
686 $known_snapshot_format_aliases{$_} : $_} @fmts;
68cedb1f Jakub Narębski2009-05-10 02:40:37 +0200687 @fmts = grep {
1bfd3631
MR
Mark Rada2009-08-06 10:25:39 -0400688 exists $known_snapshot_formats{$_} &&
689 !$known_snapshot_formats{$_}{'disabled'}} @fmts;
a781785d
JN
Jakub Narębski2007-07-22 23:41:20 +0200690}
691
8d646a9b
KN
Krzesimir Nowak2013-12-11 12:54:43 +0100692sub filter_and_validate_refs {
693 my @refs = @_;
694 my %unique_refs = ();
695
696 foreach my $ref (@refs) {
697 die_error(500, "Invalid ref '$ref' in 'extra-branch-refs' feature") unless (is_valid_ref_format($ref));
698 # 'heads' are added implicitly in get_branch_refs().
699 $unique_refs{$ref} = 1 if ($ref ne 'heads');
700 }
701 return sort keys %unique_refs;
702}
703
da4b2432
JN
Jakub Narębski2010-11-25 19:43:59 +0100704# If it is set to code reference, it is code that it is to be run once per
705# request, allowing updating configurations that change with each request,
706# while running other code in config file only once.
707#
708# Otherwise, if it is false then gitweb would process config file only once;
709# if it is true then gitweb config would be run for each request.
710our $per_request_config = 1;
711
f612a71c
JN
Jakub Narębski2011-05-25 18:35:26 +0200712# read and parse gitweb config file given by its parameter.
713# returns true on success, false on recoverable error, allowing
714# to chain this subroutine, using first file that exists.
715# dies on errors during parsing config file, as it is unrecoverable.
716sub read_config_file {
717 my $filename = shift;
718 return unless defined $filename;
719 # die if there are errors parsing config file
720 if (-e $filename) {
721 do $filename;
722 die $@ if $@;
723 return 1;
724 }
725 return;
726}
727
131d6afc Jakub Narębski2011-07-25 00:29:18 +0200728our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +0200729sub evaluate_gitweb_config {
730 our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
731 our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
131d6afc Jakub Narębski2011-07-25 00:29:18 +0200732 our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";
f612a71c Jakub Narębski2011-05-25 18:35:26 +0200733
41ccfdd9 Stefano Lattarini2013-04-12 00:36:10 +0200734 # Protect against duplications of file names, to not read config twice.
131d6afc
JN
Jakub Narębski2011-07-25 00:29:18 +0200735 # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
736 # there possibility of duplication of filename there doesn't matter.
737 $GITWEB_CONFIG = "" if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON);
738 $GITWEB_CONFIG_SYSTEM = "" if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON);
739
740 # Common system-wide settings for convenience.
741 # Those settings can be ovverriden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
742 read_config_file($GITWEB_CONFIG_COMMON);
743
744 # Use first config file that exists. This means use the per-instance
745 # GITWEB_CONFIG if exists, otherwise use GITWEB_SYSTEM_CONFIG.
746 read_config_file($GITWEB_CONFIG) and return;
f612a71c Jakub Narębski2011-05-25 18:35:26 +0200747 read_config_file($GITWEB_CONFIG_SYSTEM);
17a8b250 Gerrit Pape2008-03-26 18:11:19 +0000748}
c8d138a8 Jeff King2006-08-02 15:23:34 -0400749
b62a1a98
JWH
John 'Warthog9' Hawley2010-01-30 23:30:39 +0100750# Get loadavg of system, to compare against $maxload.
751# Currently it requires '/proc/loadavg' present to get loadavg;
752# if it is not present it returns 0, which means no load checking.
753sub get_loadavg {
754 if( -e '/proc/loadavg' ){
755 open my $fd, '<', '/proc/loadavg'
756 or return 0;
757 my @load = split(/\s+/, scalar <$fd>);
758 close $fd;
759
760 # The first three columns measure CPU and IO utilization of the last one,
761 # five, and 10 minute periods. The fourth column shows the number of
762 # currently running processes and the total number of processes in the m/n
763 # format. The last column displays the last process ID used.
764 return $load[0] || 0;
765 }
766 # additional checks for load average should go here for things that don't export
767 # /proc/loadavg
768
769 return 0;
770}
771
c8d138a8 Jeff King2006-08-02 15:23:34 -0400772# version of the core git binary
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +0200773our $git_version;
774sub evaluate_git_version {
775 our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
776 $number_of_git_cmds++;
777}
c8d138a8 Jeff King2006-08-02 15:23:34 -0400778
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +0200779sub check_loadavg {
780 if (defined $maxload && get_loadavg() > $maxload) {
781 die_error(503, "The load average on the server is too high");
782 }
b62a1a98
JWH
John 'Warthog9' Hawley2010-01-30 23:30:39 +0100783}
784
154b4d78 Jakub Narębski2006-08-05 12:55:20 +0200785# ======================================================================
09bd7898 Kay Sievers2005-08-07 20:21:23 +0200786# input validation and dispatch
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200787
788# input parameters can be collected from a variety of sources (presently, CGI
789# and PATH_INFO), so we define an %input_params hash that collects them all
790# together during validation: this allows subsequent uses (e.g. href()) to be
791# agnostic of the parameter origin
792
dde80d9c Alexander Gavrilov2008-11-06 01:10:07 +0300793our %input_params = ();
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200794
795# input parameters are stored with the long parameter name as key. This will
796# also be used in the href subroutine to convert parameters to their CGI
797# equivalent, and since the href() usage is the most frequent one, we store
798# the name -> CGI key mapping here, instead of the reverse.
799#
800# XXX: Warning: If you touch this, check the search form for updating,
801# too.
802
dde80d9c Alexander Gavrilov2008-11-06 01:10:07 +0300803our @cgi_param_mapping = (
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200804 project => "p",
805 action => "a",
806 file_name => "f",
807 file_parent => "fp",
808 hash => "h",
809 hash_parent => "hp",
810 hash_base => "hb",
811 hash_parent_base => "hpb",
812 page => "pg",
813 order => "o",
814 searchtext => "s",
815 searchtype => "st",
816 snapshot_format => "sf",
817 extra_options => "opt",
818 search_use_regexp => "sr",
0368c492 Jakub Narębski2011-04-29 19:51:57 +0200819 ctag => "by_tag",
6ba1eb51 Kato Kazuyoshi2011-10-31 00:36:22 +0100820 diff_style => "ds",
19d2d239 Bernhard R. Link2012-01-30 21:07:37 +0100821 project_filter => "pf",
c4ccf61f
JN
Jakub Narębski2009-09-01 13:39:19 +0200822 # this must be last entry (for manipulation from JavaScript)
823 javascript => "js"
1b2d297e Giuseppe Bilotta2008-10-10 20:42:26 +0200824);
dde80d9c Alexander Gavrilov2008-11-06 01:10:07 +0300825our %cgi_param_mapping = @cgi_param_mapping;
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200826
827# we will also need to know the possible actions, for validation
dde80d9c Alexander Gavrilov2008-11-06 01:10:07 +0300828our %actions = (
1b2d297e Giuseppe Bilotta2008-10-10 20:42:26 +0200829 "blame" => \&git_blame,
4af819d4
JN
Jakub Narębski2009-09-01 13:39:17 +0200830 "blame_incremental" => \&git_blame_incremental,
831 "blame_data" => \&git_blame_data,
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200832 "blobdiff" => \&git_blobdiff,
833 "blobdiff_plain" => \&git_blobdiff_plain,
834 "blob" => \&git_blob,
835 "blob_plain" => \&git_blob_plain,
836 "commitdiff" => \&git_commitdiff,
837 "commitdiff_plain" => \&git_commitdiff_plain,
838 "commit" => \&git_commit,
839 "forks" => \&git_forks,
840 "heads" => \&git_heads,
841 "history" => \&git_history,
842 "log" => \&git_log,
9872cd6f Giuseppe Bilotta2008-12-18 08:13:16 +0100843 "patch" => \&git_patch,
a3411f8a Giuseppe Bilotta2008-12-18 08:13:18 +0100844 "patches" => \&git_patches,
00fa6fef Giuseppe Bilotta2010-11-11 13:26:11 +0100845 "remotes" => \&git_remotes,
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200846 "rss" => \&git_rss,
847 "atom" => \&git_atom,
848 "search" => \&git_search,
849 "search_help" => \&git_search_help,
850 "shortlog" => \&git_shortlog,
851 "summary" => \&git_summary,
852 "tag" => \&git_tag,
853 "tags" => \&git_tags,
854 "tree" => \&git_tree,
855 "snapshot" => \&git_snapshot,
856 "object" => \&git_object,
857 # those below don't need $project
858 "opml" => \&git_opml,
859 "project_list" => \&git_project_list,
860 "project_index" => \&git_project_index,
861);
862
863# finally, we have the hash of allowed extra_options for the commands that
864# allow them
dde80d9c Alexander Gavrilov2008-11-06 01:10:07 +0300865our %allowed_options = (
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200866 "--no-merges" => [ qw(rss atom log shortlog history) ],
867);
868
869# fill %input_params with the CGI parameters. All values except for 'opt'
870# should be single values, but opt can be an array. We should probably
871# build an array of parameters that can be multi-valued, but since for the time
872# being it's only this one, we just single it out
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +0200873sub evaluate_query_params {
874 our $cgi;
875
876 while (my ($name, $symbol) = each %cgi_param_mapping) {
877 if ($symbol eq 'opt') {
13dbf46a Jeff King2014-11-18 12:10:22 -0500878 $input_params{$name} = [ map { decode_utf8($_) } $cgi->multi_param($symbol) ];
c2394fe9 Jakub Narębski2010-05-07 14:54:04 +0200879 } else {
84d9e2d5 Jakub Narębski2012-02-03 13:44:54 +0100880 $input_params{$name} = decode_utf8($cgi->param($symbol));
c2394fe9 Jakub Narębski2010-05-07 14:54:04 +0200881 }
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200882 }
883}
884
885# now read PATH_INFO and update the parameter list for missing parameters
886sub evaluate_path_info {
887 return if defined $input_params{'project'};
888 return if !$path_info;
889 $path_info =~ s,^/+,,;
890 return if !$path_info;
891
892 # find which part of PATH_INFO is project
893 my $project = $path_info;
894 $project =~ s,/+$,,;
895 while ($project && !check_head_link("$projectroot/$project")) {
896 $project =~ s,/*[^/]*$,,;
897 }
898 return unless $project;
899 $input_params{'project'} = $project;
900
901 # do not change any parameters if an action is given using the query string
902 return if $input_params{'action'};
903 $path_info =~ s,^\Q$project\E/*,,;
904
d8c28822
GB
Giuseppe Bilotta2008-10-21 21:34:50 +0200905 # next, check if we have an action
906 my $action = $path_info;
907 $action =~ s,/.*$,,;
908 if (exists $actions{$action}) {
909 $path_info =~ s,^$action/*,,;
910 $input_params{'action'} = $action;
911 }
912
913 # list of actions that want hash_base instead of hash, but can have no
914 # pathname (f) parameter
915 my @wants_base = (
916 'tree',
917 'history',
918 );
919
7e00dc58 Jakub Narębski2010-10-13 13:33:48 +0200920 # we want to catch, among others
b0be3838
GB
Giuseppe Bilotta2008-10-21 21:34:53 +0200921 # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
922 my ($parentrefname, $parentpathname, $refname, $pathname) =
7e00dc58 Jakub Narębski2010-10-13 13:33:48 +0200923 ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
b0be3838
GB
Giuseppe Bilotta2008-10-21 21:34:53 +0200924
925 # first, analyze the 'current' part
1b2d297e Giuseppe Bilotta2008-10-10 20:42:26 +0200926 if (defined $pathname) {
d8c28822
GB
Giuseppe Bilotta2008-10-21 21:34:50 +0200927 # we got "branch:filename" or "branch:dir/"
928 # we could use git_get_type(branch:pathname), but:
929 # - it needs $git_dir
930 # - it does a git() call
931 # - the convention of terminating directories with a slash
932 # makes it superfluous
933 # - embedding the action in the PATH_INFO would make it even
934 # more superfluous
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200935 $pathname =~ s,^/+,,;
936 if (!$pathname || substr($pathname, -1) eq "/") {
d8c28822 Giuseppe Bilotta2008-10-21 21:34:50 +0200937 $input_params{'action'} ||= "tree";
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200938 $pathname =~ s,/$,,;
939 } else {
b0be3838
GB
Giuseppe Bilotta2008-10-21 21:34:53 +0200940 # the default action depends on whether we had parent info
941 # or not
942 if ($parentrefname) {
943 $input_params{'action'} ||= "blobdiff_plain";
944 } else {
945 $input_params{'action'} ||= "blob_plain";
946 }
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +0200947 }
948 $input_params{'hash_base'} ||= $refname;
949 $input_params{'file_name'} ||= $pathname;
950 } elsif (defined $refname) {
d8c28822
GB
Giuseppe Bilotta2008-10-21 21:34:50 +0200951 # we got "branch". In this case we have to choose if we have to
952 # set hash or hash_base.
953 #
954 # Most of the actions without a pathname only want hash to be
955 # set, except for the ones specified in @wants_base that want
956 # hash_base instead. It should also be noted that hand-crafted
957 # links having 'history' as an action and no pathname or hash
958 # set will fail, but that happens regardless of PATH_INFO.
d0af3734
JN
Jakub Narębski2010-10-13 13:35:20 +0200959 if (defined $parentrefname) {
960 # if there is parent let the default be 'shortlog' action
961 # (for http://git.example.com/repo.git/A..B links); if there
962 # is no parent, dispatch will detect type of object and set
963 # action appropriately if required (if action is not set)
964 $input_params{'action'} ||= "shortlog";
965 }
966 if ($input_params{'action'} &&
967 grep { $_ eq $input_params{'action'} } @wants_base) {
d8c28822
GB
Giuseppe Bilotta2008-10-21 21:34:50 +0200968 $input_params{'hash_base'} ||= $refname;
969 } else {
970 $input_params{'hash'} ||= $refname;
971 }
1b2d297e Giuseppe Bilotta2008-10-10 20:42:26 +0200972 }
b0be3838
GB
Giuseppe Bilotta2008-10-21 21:34:53 +0200973
974 # next, handle the 'parent' part, if present
975 if (defined $parentrefname) {
976 # a missing pathspec defaults to the 'current' filename, allowing e.g.
977 # someproject/blobdiff/oldrev..newrev:/filename
978 if ($parentpathname) {
979 $parentpathname =~ s,^/+,,;
980 $parentpathname =~ s,/$,,;
981 $input_params{'file_parent'} ||= $parentpathname;
982 } else {
983 $input_params{'file_parent'} ||= $input_params{'file_name'};
984 }
985 # we assume that hash_parent_base is wanted if a path was specified,
986 # or if the action wants hash_base instead of hash
987 if (defined $input_params{'file_parent'} ||
988 grep { $_ eq $input_params{'action'} } @wants_base) {
989 $input_params{'hash_parent_base'} ||= $parentrefname;
990 } else {
991 $input_params{'hash_parent'} ||= $parentrefname;
992 }
993 }
1ec2fb5f
GB
Giuseppe Bilotta2008-11-02 10:21:38 +0100994
995 # for the snapshot action, we allow URLs in the form
996 # $project/snapshot/$hash.ext
997 # where .ext determines the snapshot and gets removed from the
998 # passed $refname to provide the $hash.
999 #
1000 # To be able to tell that $refname includes the format extension, we
1001 # require the following two conditions to be satisfied:
1002 # - the hash input parameter MUST have been set from the $refname part
1003 # of the URL (i.e. they must be equal)
1004 # - the snapshot format MUST NOT have been defined already (e.g. from
1005 # CGI parameter sf)
1006 # It's also useless to try any matching unless $refname has a dot,
1007 # so we check for that too
1008 if (defined $input_params{'action'} &&
1009 $input_params{'action'} eq 'snapshot' &&
1010 defined $refname && index($refname, '.') != -1 &&
1011 $refname eq $input_params{'hash'} &&
1012 !defined $input_params{'snapshot_format'}) {
1013 # We loop over the known snapshot formats, checking for
1014 # extensions. Allowed extensions are both the defined suffix
1015 # (which includes the initial dot already) and the snapshot
1016 # format key itself, with a prepended dot
ccb4b539 Holger Weiß2009-03-31 18:16:36 +02001017 while (my ($fmt, $opt) = each %known_snapshot_formats) {
1ec2fb5f Giuseppe Bilotta2008-11-02 10:21:38 +01001018 my $hash = $refname;
095e9142
JN
Jakub Narębski2009-05-11 19:42:47 +02001019 unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
1020 next;
1021 }
1022 my $sfx = $1;
1ec2fb5f
GB
Giuseppe Bilotta2008-11-02 10:21:38 +01001023 # a valid suffix was found, so set the snapshot format
1024 # and reset the hash parameter
1025 $input_params{'snapshot_format'} = $fmt;
1026 $input_params{'hash'} = $hash;
1027 # we also set the format suffix to the one requested
1028 # in the URL: this way a request for e.g. .tgz returns
1029 # a .tgz instead of a .tar.gz
1030 $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
1031 last;
1032 }
1033 }
1b2d297e Giuseppe Bilotta2008-10-10 20:42:26 +02001034}
1b2d297e Giuseppe Bilotta2008-10-10 20:42:26 +02001035
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001036our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
1037 $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
19d2d239 Bernhard R. Link2012-01-30 21:07:37 +01001038 $searchtext, $search_regexp, $project_filter);
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001039sub evaluate_and_validate_params {
1040 our $action = $input_params{'action'};
1041 if (defined $action) {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001042 if (!is_valid_action($action)) {
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001043 die_error(400, "Invalid action parameter");
1044 }
b87d78d6 Kay Sievers2005-08-07 20:21:04 +02001045 }
44ad2978 Kay Sievers2005-08-07 19:59:24 +02001046
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001047 # parameters which are pathnames
1048 our $project = $input_params{'project'};
1049 if (defined $project) {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001050 if (!is_valid_project($project)) {
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001051 undef $project;
1052 die_error(404, "No such project");
1053 }
9cd3d988 Kay Sievers2005-08-07 20:17:42 +02001054 }
6191f8e1 Kay Sievers2005-08-07 20:19:56 +02001055
19d2d239
BL
Bernhard R. Link2012-01-30 21:07:37 +01001056 our $project_filter = $input_params{'project_filter'};
1057 if (defined $project_filter) {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001058 if (!is_valid_pathname($project_filter)) {
19d2d239
BL
Bernhard R. Link2012-01-30 21:07:37 +01001059 die_error(404, "Invalid project_filter parameter");
1060 }
1061 }
1062
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001063 our $file_name = $input_params{'file_name'};
1064 if (defined $file_name) {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001065 if (!is_valid_pathname($file_name)) {
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001066 die_error(400, "Invalid file parameter");
1067 }
24d0693a Jakub Narębski2006-09-26 01:57:02 +02001068 }
24d0693a Jakub Narębski2006-09-26 01:57:02 +02001069
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001070 our $file_parent = $input_params{'file_parent'};
1071 if (defined $file_parent) {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001072 if (!is_valid_pathname($file_parent)) {
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001073 die_error(400, "Invalid file parent parameter");
1074 }
24d0693a Jakub Narębski2006-09-26 01:57:02 +02001075 }
5c95fab0 Martin Waitz2006-08-17 00:28:38 +02001076
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001077 # parameters which are refnames
1078 our $hash = $input_params{'hash'};
1079 if (defined $hash) {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001080 if (!is_valid_refname($hash)) {
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001081 die_error(400, "Invalid hash parameter");
1082 }
4fac5294 Kay Sievers2005-08-07 20:27:38 +02001083 }
6191f8e1 Kay Sievers2005-08-07 20:19:56 +02001084
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001085 our $hash_parent = $input_params{'hash_parent'};
1086 if (defined $hash_parent) {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001087 if (!is_valid_refname($hash_parent)) {
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001088 die_error(400, "Invalid hash parent parameter");
1089 }
c91da262 Kay Sievers2005-09-03 14:50:33 +02001090 }
09bd7898 Kay Sievers2005-08-07 20:21:23 +02001091
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001092 our $hash_base = $input_params{'hash_base'};
1093 if (defined $hash_base) {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001094 if (!is_valid_refname($hash_base)) {
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001095 die_error(400, "Invalid hash base parameter");
1096 }
c91da262 Kay Sievers2005-09-03 14:50:33 +02001097 }
6191f8e1 Kay Sievers2005-08-07 20:19:56 +02001098
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001099 our @extra_options = @{$input_params{'extra_options'}};
1100 # @extra_options is always defined, since it can only be (currently) set from
1101 # CGI, and $cgi->param() returns the empty array in array context if the param
1102 # is not set
1103 foreach my $opt (@extra_options) {
1104 if (not exists $allowed_options{$opt}) {
1105 die_error(400, "Invalid option parameter");
1106 }
1107 if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
1108 die_error(400, "Invalid option parameter for this action");
1109 }
868bc068 Miklos Vajna2007-07-12 20:39:27 +02001110 }
868bc068 Miklos Vajna2007-07-12 20:39:27 +02001111
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001112 our $hash_parent_base = $input_params{'hash_parent_base'};
1113 if (defined $hash_parent_base) {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001114 if (!is_valid_refname($hash_parent_base)) {
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001115 die_error(400, "Invalid hash parent base parameter");
1116 }
420e92f2 Jakub Narębski2006-08-24 23:53:54 +02001117 }
420e92f2 Jakub Narębski2006-08-24 23:53:54 +02001118
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001119 # other parameters
1120 our $page = $input_params{'page'};
1121 if (defined $page) {
1122 if ($page =~ m/[^0-9]/) {
1123 die_error(400, "Invalid page parameter");
1124 }
b87d78d6 Kay Sievers2005-08-07 20:21:04 +02001125 }
823d5dc8 Kay Sievers2005-08-07 19:57:58 +02001126
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001127 our $searchtype = $input_params{'searchtype'};
1128 if (defined $searchtype) {
1129 if ($searchtype =~ m/[^a-z]/) {
1130 die_error(400, "Invalid searchtype parameter");
1131 }
e7738553 Petr Baudis2007-05-17 04:31:12 +02001132 }
e7738553 Petr Baudis2007-05-17 04:31:12 +02001133
c2394fe9 Jakub Narębski2010-05-07 14:54:04 +02001134 our $search_use_regexp = $input_params{'search_use_regexp'};
0e559919 Petr Baudis2008-02-26 13:22:08 +01001135
c2394fe9 Jakub Narębski2010-05-07 14:54:04 +02001136 our $searchtext = $input_params{'searchtext'};
ca7a5dcf Charles McGarvey2013-06-04 22:44:28 -06001137 our $search_regexp = undef;
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001138 if (defined $searchtext) {
1139 if (length($searchtext) < 2) {
1140 die_error(403, "At least two characters are required for search parameter");
1141 }
36612e4d
JN
Jakub Narębski2012-02-28 19:41:47 +01001142 if ($search_use_regexp) {
1143 $search_regexp = $searchtext;
1144 if (!eval { qr/$search_regexp/; 1; }) {
1145 (my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
1146 die_error(400, "Invalid search regexp '$search_regexp'",
1147 esc_html($error));
1148 }
1149 } else {
1150 $search_regexp = quotemeta $searchtext;
1151 }
9d032c72 Robert Fitzsimons2006-12-23 03:35:15 +00001152 }
19806691
KS
Kay Sievers2005-08-07 20:26:27 +02001153}
1154
645927ce
ML
Matthias Lederhofer2006-09-17 15:29:48 +02001155# path to the current git repository
1156our $git_dir;
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001157sub evaluate_git_dir {
1158 our $git_dir = "$projectroot/$project" if $project;
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +02001159}
1160
8d646a9b Krzesimir Nowak2013-12-11 12:54:43 +01001161our (@snapshot_fmts, $git_avatar, @extra_branch_refs);
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001162sub configure_gitweb_features {
1163 # list of supported snapshot formats
1164 our @snapshot_fmts = gitweb_get_feature('snapshot');
1165 @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);
1166
1167 # check that the avatar feature is set to a known provider name,
1168 # and for each provider check if the dependencies are satisfied.
1169 # if the provider name is invalid or the dependencies are not met,
1170 # reset $git_avatar to the empty string.
1171 our ($git_avatar) = gitweb_get_feature('avatar');
1172 if ($git_avatar eq 'gravatar') {
1173 $git_avatar = '' unless (eval { require Digest::MD5; 1; });
1174 } elsif ($git_avatar eq 'picon') {
1175 # no dependencies
7f9778b1 Gerrit Pape2007-05-10 07:32:07 +00001176 } else {
c2394fe9 Jakub Narębski2010-05-07 14:54:04 +02001177 $git_avatar = '';
7f9778b1 Gerrit Pape2007-05-10 07:32:07 +00001178 }
8d646a9b
KN
Krzesimir Nowak2013-12-11 12:54:43 +01001179
1180 our @extra_branch_refs = gitweb_get_feature('extra-branch-refs');
1181 @extra_branch_refs = filter_and_validate_refs (@extra_branch_refs);
1182}
1183
1184sub get_branch_refs {
1185 return ('heads', @extra_branch_refs);
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +02001186}
1187
7a597457
JN
Jakub Narębski2010-04-24 16:00:04 +02001188# custom error handler: 'die <message>' is Internal Server Error
1189sub handle_errors_html {
1190 my $msg = shift; # it is already HTML escaped
1191
1192 # to avoid infinite loop where error occurs in die_error,
1193 # change handler to default handler, disabling handle_errors_html
41ccfdd9 Stefano Lattarini2013-04-12 00:36:10 +02001194 set_message("Error occurred when inside die_error:\n$msg");
7a597457
JN
Jakub Narębski2010-04-24 16:00:04 +02001195
1196 # you cannot jump out of die_error when called as error handler;
1197 # the subroutine set via CGI::Carp::set_message is called _after_
1198 # HTTP headers are already written, so it cannot write them itself
1199 die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
1200}
1201set_message(\&handle_errors_html);
1202
717b8311 Jakub Narębski2006-07-31 21:22:15 +02001203# dispatch
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001204sub dispatch {
1205 if (!defined $action) {
1206 if (defined $hash) {
1207 $action = git_get_type($hash);
18ab83e8 Jakub Narębski2012-01-07 11:47:38 +01001208 $action or die_error(404, "Object does not exist");
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001209 } elsif (defined $hash_base && defined $file_name) {
1210 $action = git_get_type("$hash_base:$file_name");
18ab83e8 Jakub Narębski2012-01-07 11:47:38 +01001211 $action or die_error(404, "File or directory does not exist");
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001212 } elsif (defined $project) {
1213 $action = 'summary';
1214 } else {
1215 $action = 'project_list';
1216 }
7f9778b1 Gerrit Pape2007-05-10 07:32:07 +00001217 }
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001218 if (!defined($actions{$action})) {
1219 die_error(400, "Unknown action");
1220 }
1221 if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
1222 !$project) {
1223 die_error(400, "Project needed");
1224 }
1225 $actions{$action}->();
77a153fd Jakub Narębski2006-08-22 16:59:20 +02001226}
c2394fe9 Jakub Narębski2010-05-07 14:54:04 +02001227
869d5881 Jakub Narębski2010-07-05 20:52:43 +02001228sub reset_timer {
3962f1d7 Jakub Narębski2010-11-09 19:27:54 +01001229 our $t0 = [ gettimeofday() ]
c2394fe9 Jakub Narębski2010-05-07 14:54:04 +02001230 if defined $t0;
869d5881
JN
Jakub Narębski2010-07-05 20:52:43 +02001231 our $number_of_git_cmds = 0;
1232}
1233
da4b2432 Jakub Narębski2010-11-25 19:43:59 +01001234our $first_request = 1;
869d5881
JN
Jakub Narębski2010-07-05 20:52:43 +02001235sub run_request {
1236 reset_timer();
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001237
1238 evaluate_uri();
da4b2432
JN
Jakub Narębski2010-11-25 19:43:59 +01001239 if ($first_request) {
1240 evaluate_gitweb_config();
1241 evaluate_git_version();
1242 }
1243 if ($per_request_config) {
1244 if (ref($per_request_config) eq 'CODE') {
1245 $per_request_config->();
1246 } elsif (!$first_request) {
1247 evaluate_gitweb_config();
1248 }
1249 }
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001250 check_loadavg();
1251
7f425db9
JN
Jonathan Nieder2010-07-30 22:01:59 -05001252 # $projectroot and $projects_list might be set in gitweb config file
1253 $projects_list ||= $projectroot;
1254
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001255 evaluate_query_params();
1256 evaluate_path_info();
1257 evaluate_and_validate_params();
1258 evaluate_git_dir();
1259
1260 configure_gitweb_features();
1261
1262 dispatch();
09bd7898 Kay Sievers2005-08-07 20:21:23 +02001263}
a0446e7b
SV
Sam Vilain2010-05-07 14:54:05 +02001264
1265our $is_last_request = sub { 1 };
1266our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
1267our $CGI = 'CGI';
1268our $cgi;
45aa9895
JN
Jakub Narębski2010-06-05 23:11:18 +02001269sub configure_as_fcgi {
1270 require CGI::Fast;
1271 our $CGI = 'CGI::Fast';
1272
1273 my $request_number = 0;
1274 # let each child service 100 requests
1275 our $is_last_request = sub { ++$request_number > 100 };
d04d3d42 Jakub Narębski2006-09-19 21:53:22 +02001276}
a0446e7b Sam Vilain2010-05-07 14:54:05 +02001277sub evaluate_argv {
45aa9895
JN
Jakub Narębski2010-06-05 23:11:18 +02001278 my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
1279 configure_as_fcgi()
1280 if $script_name =~ /\.fcgi$/;
1281
a0446e7b
SV
Sam Vilain2010-05-07 14:54:05 +02001282 return unless (@ARGV);
1283
1284 require Getopt::Long;
1285 Getopt::Long::GetOptions(
45aa9895 Jakub Narębski2010-06-05 23:11:18 +02001286 'fastcgi|fcgi|f' => \&configure_as_fcgi,
a0446e7b
SV
Sam Vilain2010-05-07 14:54:05 +02001287 'nproc|n=i' => sub {
1288 my ($arg, $val) = @_;
1289 return unless eval { require FCGI::ProcManager; 1; };
1290 my $proc_manager = FCGI::ProcManager->new({
1291 n_processes => $val,
1292 });
1293 our $pre_listen_hook = sub { $proc_manager->pm_manage() };
1294 our $pre_dispatch_hook = sub { $proc_manager->pm_pre_dispatch() };
1295 our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
1296 },
1297 );
1298}
1299
1300sub run {
1301 evaluate_argv();
869d5881 Jakub Narębski2010-07-05 20:52:43 +02001302
da4b2432 Jakub Narębski2010-11-25 19:43:59 +01001303 $first_request = 1;
a0446e7b
SV
Sam Vilain2010-05-07 14:54:05 +02001304 $pre_listen_hook->()
1305 if $pre_listen_hook;
1306
1307 REQUEST:
1308 while ($cgi = $CGI->new()) {
1309 $pre_dispatch_hook->()
1310 if $pre_dispatch_hook;
1311
1312 run_request();
1313
0b45010e Jakub Narębski2010-08-02 22:21:47 +02001314 $post_dispatch_hook->()
a0446e7b Sam Vilain2010-05-07 14:54:05 +02001315 if $post_dispatch_hook;
da4b2432 Jakub Narębski2010-11-25 19:43:59 +01001316 $first_request = 0;
a0446e7b
SV
Sam Vilain2010-05-07 14:54:05 +02001317
1318 last REQUEST if ($is_last_request->());
1319 }
c2394fe9
JN
Jakub Narębski2010-05-07 14:54:04 +02001320
1321 DONE_GITWEB:
1322 1;
d04d3d42 Jakub Narębski2006-09-19 21:53:22 +02001323}
a0446e7b Sam Vilain2010-05-07 14:54:05 +02001324
c2394fe9 Jakub Narębski2010-05-07 14:54:04 +02001325run();
09bd7898 Kay Sievers2005-08-07 20:21:23 +02001326
5ed2ec10
JN
Jakub Narębski2010-06-13 12:09:32 +02001327if (defined caller) {
1328 # wrapped in a subroutine processing requests,
1329 # e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
1330 return;
1331} else {
1332 # pure CGI script, serving single request
1333 exit;
1334}
09bd7898 Kay Sievers2005-08-07 20:21:23 +02001335
717b8311 Jakub Narębski2006-07-31 21:22:15 +02001336## ======================================================================
06a9d86b
MW
Martin Waitz2006-08-16 00:23:50 +02001337## action links
1338
377bee34
JN
Jakub Narębski2010-04-24 15:53:19 +02001339# possible values of extra options
1340# -full => 0|1 - use absolute/full URL ($my_uri/$my_url as base)
1341# -replay => 1 - start from a current view (replay with modifications)
1342# -path_info => 0|1 - don't use/use path_info URL (if possible)
5e96a847 Kevin Cernekee2011-03-18 17:00:16 +01001343# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
74fd8728 Jakub Narębski2009-05-07 19:11:29 +02001344sub href {
498fe002 Jakub Narębski2006-08-22 19:05:25 +02001345 my %params = @_;
bd5d1e42
JN
Jakub Narębski2006-11-19 15:05:21 +01001346 # default is to use -absolute url() i.e. $my_uri
1347 my $href = $params{-full} ? $my_url : $my_uri;
498fe002 Jakub Narębski2006-08-22 19:05:25 +02001348
5e96a847
KC
Kevin Cernekee2011-03-18 17:00:16 +01001349 # implicit -replay, must be first of implicit params
1350 $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});
1351
afa9b620
JN
Jakub Narębski2008-02-14 09:22:30 +01001352 $params{'project'} = $project unless exists $params{'project'};
1353
1cad283a Jakub Narębski2007-11-01 13:06:27 +01001354 if ($params{-replay}) {
1b2d297e Giuseppe Bilotta2008-10-10 20:42:26 +02001355 while (my ($name, $symbol) = each %cgi_param_mapping) {
1cad283a Jakub Narębski2007-11-01 13:06:27 +01001356 if (!exists $params{$name}) {
1b2d297e Giuseppe Bilotta2008-10-10 20:42:26 +02001357 $params{$name} = $input_params{$name};
1cad283a
JN
Jakub Narębski2007-11-01 13:06:27 +01001358 }
1359 }
1360 }
1361
25b2790f Giuseppe Bilotta2008-11-29 13:07:29 -08001362 my $use_pathinfo = gitweb_check_feature('pathinfo');
377bee34
JN
Jakub Narębski2010-04-24 15:53:19 +02001363 if (defined $params{'project'} &&
1364 (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
b02bd7a6
GB
Giuseppe Bilotta2008-10-21 21:34:51 +02001365 # try to put as many parameters as possible in PATH_INFO:
1366 # - project name
1367 # - action
8db49a7f Giuseppe Bilotta2008-10-21 21:34:54 +02001368 # - hash_parent or hash_parent_base:/file_parent
3550ea71 Giuseppe Bilotta2008-10-21 21:34:52 +02001369 # - hash or hash_base:/filename
c752a0e0 Giuseppe Bilotta2008-11-02 10:21:39 +01001370 # - the snapshot_format as an appropriate suffix
b02bd7a6
GB
Giuseppe Bilotta2008-10-21 21:34:51 +02001371
1372 # When the script is the root DirectoryIndex for the domain,
1373 # $href here would be something like http://gitweb.example.com/
1374 # Thus, we strip any trailing / from $href, to spare us double
1375 # slashes in the final URL
1376 $href =~ s,/$,,;
1377
1378 # Then add the project name, if present
67976c65 Jakub Narębski2010-12-14 16:54:31 +01001379 $href .= "/".esc_path_info($params{'project'});
9e756904
MW
Martin Waitz2006-10-01 23:57:48 +02001380 delete $params{'project'};
1381
c752a0e0
GB
Giuseppe Bilotta2008-11-02 10:21:39 +01001382 # since we destructively absorb parameters, we keep this
1383 # boolean that remembers if we're handling a snapshot
1384 my $is_snapshot = $params{'action'} eq 'snapshot';
1385
b02bd7a6
GB
Giuseppe Bilotta2008-10-21 21:34:51 +02001386 # Summary just uses the project path URL, any other action is
1387 # added to the URL
1388 if (defined $params{'action'}) {
67976c65
JN
Jakub Narębski2010-12-14 16:54:31 +01001389 $href .= "/".esc_path_info($params{'action'})
1390 unless $params{'action'} eq 'summary';
9e756904
MW
Martin Waitz2006-10-01 23:57:48 +02001391 delete $params{'action'};
1392 }
b02bd7a6 Giuseppe Bilotta2008-10-21 21:34:51 +02001393
8db49a7f
GB
Giuseppe Bilotta2008-10-21 21:34:54 +02001394 # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
1395 # stripping nonexistent or useless pieces
1396 $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
1397 || $params{'hash_parent'} || $params{'hash'});
b02bd7a6 Giuseppe Bilotta2008-10-21 21:34:51 +02001398 if (defined $params{'hash_base'}) {
8db49a7f Giuseppe Bilotta2008-10-21 21:34:54 +02001399 if (defined $params{'hash_parent_base'}) {
67976c65 Jakub Narębski2010-12-14 16:54:31 +01001400 $href .= esc_path_info($params{'hash_parent_base'});
8db49a7f Giuseppe Bilotta2008-10-21 21:34:54 +02001401 # skip the file_parent if it's the same as the file_name
b7da721f
GB
Giuseppe Bilotta2009-07-31 08:48:49 +02001402 if (defined $params{'file_parent'}) {
1403 if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
1404 delete $params{'file_parent'};
1405 } elsif ($params{'file_parent'} !~ /\.\./) {
67976c65 Jakub Narębski2010-12-14 16:54:31 +01001406 $href .= ":/".esc_path_info($params{'file_parent'});
b7da721f
GB
Giuseppe Bilotta2009-07-31 08:48:49 +02001407 delete $params{'file_parent'};
1408 }
8db49a7f
GB
Giuseppe Bilotta2008-10-21 21:34:54 +02001409 }
1410 $href .= "..";
1411 delete $params{'hash_parent'};
1412 delete $params{'hash_parent_base'};
1413 } elsif (defined $params{'hash_parent'}) {
67976c65 Jakub Narębski2010-12-14 16:54:31 +01001414 $href .= esc_path_info($params{'hash_parent'}). "..";
8db49a7f
GB
Giuseppe Bilotta2008-10-21 21:34:54 +02001415 delete $params{'hash_parent'};
1416 }
1417
67976c65 Jakub Narębski2010-12-14 16:54:31 +01001418 $href .= esc_path_info($params{'hash_base'});
8db49a7f Giuseppe Bilotta2008-10-21 21:34:54 +02001419 if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
67976c65 Jakub Narębski2010-12-14 16:54:31 +01001420 $href .= ":/".esc_path_info($params{'file_name'});
b02bd7a6
GB
Giuseppe Bilotta2008-10-21 21:34:51 +02001421 delete $params{'file_name'};
1422 }
1423 delete $params{'hash'};
1424 delete $params{'hash_base'};
1425 } elsif (defined $params{'hash'}) {
67976c65 Jakub Narębski2010-12-14 16:54:31 +01001426 $href .= esc_path_info($params{'hash'});
b02bd7a6
GB
Giuseppe Bilotta2008-10-21 21:34:51 +02001427 delete $params{'hash'};
1428 }
c752a0e0
GB
Giuseppe Bilotta2008-11-02 10:21:39 +01001429
1430 # If the action was a snapshot, we can absorb the
1431 # snapshot_format parameter too
1432 if ($is_snapshot) {
1433 my $fmt = $params{'snapshot_format'};
1434 # snapshot_format should always be defined when href()
1435 # is called, but just in case some code forgets, we
1436 # fall back to the default
1437 $fmt ||= $snapshot_fmts[0];
1438 $href .= $known_snapshot_formats{$fmt}{'suffix'};
1439 delete $params{'snapshot_format'};
1440 }
9e756904
MW
Martin Waitz2006-10-01 23:57:48 +02001441 }
1442
1443 # now encode the parameters explicitly
498fe002 Jakub Narębski2006-08-22 19:05:25 +02001444 my @result = ();
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +02001445 for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
1446 my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
498fe002 Jakub Narębski2006-08-22 19:05:25 +02001447 if (defined $params{$name}) {
f22cca44
JN
Jakub Narębski2007-07-29 01:04:09 +02001448 if (ref($params{$name}) eq "ARRAY") {
1449 foreach my $par (@{$params{$name}}) {
1450 push @result, $symbol . "=" . esc_param($par);
1451 }
1452 } else {
1453 push @result, $symbol . "=" . esc_param($params{$name});
1454 }
498fe002
JN
Jakub Narębski2006-08-22 19:05:25 +02001455 }
1456 }
9e756904
MW
Martin Waitz2006-10-01 23:57:48 +02001457 $href .= "?" . join(';', @result) if scalar @result;
1458
67976c65
JN
Jakub Narębski2010-12-14 16:54:31 +01001459 # final transformation: trailing spaces must be escaped (URI-encoded)
1460 $href =~ s/(\s+)$/CGI::escape($1)/e;
1461
5e96a847
KC
Kevin Cernekee2011-03-18 17:00:16 +01001462 if ($params{-anchor}) {
1463 $href .= "#".esc_param($params{-anchor});
1464 }
1465
9e756904 Martin Waitz2006-10-01 23:57:48 +02001466 return $href;
06a9d86b
MW
Martin Waitz2006-08-16 00:23:50 +02001467}
1468
1469
1470## ======================================================================
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001471## validation, quoting/unquoting and escaping
1472
23faf546
KN
Krzesimir Nowak2013-12-11 12:54:42 +01001473sub is_valid_action {
1474 my $input = shift;
1b2d297e Giuseppe Bilotta2008-10-10 20:42:26 +02001475 return undef unless exists $actions{$input};
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001476 return 1;
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +02001477}
1478
23faf546
KN
Krzesimir Nowak2013-12-11 12:54:42 +01001479sub is_valid_project {
1480 my $input = shift;
1481
1482 return unless defined $input;
1483 if (!is_valid_pathname($input) ||
1b2d297e Giuseppe Bilotta2008-10-10 20:42:26 +02001484 !(-d "$projectroot/$input") ||
ec26f098 Alexander Gavrilov2008-11-06 01:15:56 +03001485 !check_export_ok("$projectroot/$input") ||
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +02001486 ($strict_export && !project_in_list($input))) {
1487 return undef;
1488 } else {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001489 return 1;
1b2d297e
GB
Giuseppe Bilotta2008-10-10 20:42:26 +02001490 }
1491}
1492
23faf546
KN
Krzesimir Nowak2013-12-11 12:54:42 +01001493sub is_valid_pathname {
1494 my $input = shift;
717b8311 Jakub Narębski2006-07-31 21:22:15 +02001495
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001496 return undef unless defined $input;
01689909 Justin Lebar2014-03-31 15:11:46 -07001497 # no '.' or '..' as elements of path, i.e. no '.' or '..'
24d0693a
JN
Jakub Narębski2006-09-26 01:57:02 +02001498 # at the beginning, at the end, and between slashes.
1499 # also this catches doubled slashes
1500 if ($input =~ m!(^|/)(|\.|\.\.)(/|$)!) {
1501 return undef;
717b8311 Jakub Narębski2006-07-31 21:22:15 +02001502 }
24d0693a
JN
Jakub Narębski2006-09-26 01:57:02 +02001503 # no null characters
1504 if ($input =~ m!\0!) {
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001505 return undef;
1506 }
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001507 return 1;
24d0693a
JN
Jakub Narębski2006-09-26 01:57:02 +02001508}
1509
c0bc2265 Krzesimir Nowak2013-12-11 12:54:41 +01001510sub is_valid_ref_format {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001511 my $input = shift;
c0bc2265 Krzesimir Nowak2013-12-11 12:54:41 +01001512
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001513 return undef unless defined $input;
c0bc2265
KN
Krzesimir Nowak2013-12-11 12:54:41 +01001514 # restrictions on ref name according to git-check-ref-format
1515 if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
1516 return undef;
1517 }
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001518 return 1;
c0bc2265
KN
Krzesimir Nowak2013-12-11 12:54:41 +01001519}
1520
23faf546
KN
Krzesimir Nowak2013-12-11 12:54:42 +01001521sub is_valid_refname {
1522 my $input = shift;
24d0693a Jakub Narębski2006-09-26 01:57:02 +02001523
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001524 return undef unless defined $input;
24d0693a
JN
Jakub Narębski2006-09-26 01:57:02 +02001525 # textual hashes are O.K.
1526 if ($input =~ m/^[0-9a-fA-F]{40}$/) {
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001527 return 1;
24d0693a
JN
Jakub Narębski2006-09-26 01:57:02 +02001528 }
1529 # it must be correct pathname
23faf546 Krzesimir Nowak2013-12-11 12:54:42 +01001530 is_valid_pathname($input) or return undef;
c0bc2265 Krzesimir Nowak2013-12-11 12:54:41 +01001531 # check git-check-ref-format restrictions
23faf546
KN
Krzesimir Nowak2013-12-11 12:54:42 +01001532 is_valid_ref_format($input) or return undef;
1533 return 1;
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001534}
1535
00f429af
MK
Martin Koegler2007-06-03 17:42:44 +02001536# decode sequences of octets in utf8 into Perl's internal form,
1537# which is utf-8 with utf8 flag set if needed. gitweb writes out
1538# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
1539sub to_utf8 {
1540 my $str = shift;
1df48766 Jakub Narębski2010-02-07 21:52:25 +01001541 return undef unless defined $str;
b13e3eac
JN
Jakub Narębski2011-12-18 23:00:58 +01001542
1543 if (utf8::is_utf8($str) || utf8::decode($str)) {
e5d3de5c İsmail Dönmez2007-12-04 10:55:41 +02001544 return $str;
00f429af
MK
Martin Koegler2007-06-03 17:42:44 +02001545 } else {
1546 return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
1547 }
1548}
1549
232ff553
KS
Kay Sievers2005-11-24 16:56:55 +01001550# quote unsafe chars, but keep the slash, even when it's not
1551# correct, but quoted slashes look too horrible in bookmarks
1552sub esc_param {
353347b0 Kay Sievers2005-11-14 05:47:18 +01001553 my $str = shift;
1df48766 Jakub Narębski2010-02-07 21:52:25 +01001554 return undef unless defined $str;
452e2256 Giuseppe Bilotta2009-10-13 21:51:36 +02001555 $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
a9e60b7d Kay Sievers2005-11-14 15:15:12 +01001556 $str =~ s/ /\+/g;
353347b0
KS
Kay Sievers2005-11-14 05:47:18 +01001557 return $str;
1558}
1559
67976c65
JN
Jakub Narębski2010-12-14 16:54:31 +01001560# the quoting rules for path_info fragment are slightly different
1561sub esc_path_info {
1562 my $str = shift;
1563 return undef unless defined $str;
1564
1565 # path_info doesn't treat '+' as space (specially), but '?' must be escaped
1566 $str =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;
1567
1568 return $str;
1569}
1570
22e5e58a Ralf Wildenhues2010-08-22 13:12:12 +02001571# quote unsafe chars in whole URL, so some characters cannot be quoted
f93bff8d
JN
Jakub Narębski2006-09-26 01:58:41 +02001572sub esc_url {
1573 my $str = shift;
1df48766 Jakub Narębski2010-02-07 21:52:25 +01001574 return undef unless defined $str;
109988f2 Pavan Kumar Sunkara2010-07-15 12:59:01 +05301575 $str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
f93bff8d
JN
Jakub Narębski2006-09-26 01:58:41 +02001576 $str =~ s/ /\+/g;
1577 return $str;
1578}
1579
3017ed62
JN
Jakub Narębski2010-12-15 00:34:01 +01001580# quote unsafe characters in HTML attributes
1581sub esc_attr {
1582
1583 # for XHTML conformance escaping '"' to '&quot;' is not enough
1584 return esc_html(@_);
1585}
1586
232ff553 Kay Sievers2005-11-24 16:56:55 +01001587# replace invalid utf8 character with SUBSTITUTION sequence
74fd8728 Jakub Narębski2009-05-07 19:11:29 +02001588sub esc_html {
40c13813 Kay Sievers2005-11-19 17:41:29 +01001589 my $str = shift;
6255ef08
JN
Jakub Narębski2006-11-01 14:33:21 +01001590 my %opts = @_;
1591
1df48766
JN
Jakub Narębski2010-02-07 21:52:25 +01001592 return undef unless defined $str;
1593
00f429af Martin Koegler2007-06-03 17:42:44 +02001594 $str = to_utf8($str);
c390ae97 Li Yang2007-03-06 11:58:56 +08001595 $str = $cgi->escapeHTML($str);
6255ef08
JN
Jakub Narębski2006-11-01 14:33:21 +01001596 if ($opts{'-nbsp'}) {
1597 $str =~ s/ /&nbsp;/g;
1598 }
25ffbb27 Junio C Hamano2006-11-08 15:11:10 -08001599 $str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
40c13813
KS
Kay Sievers2005-11-19 17:41:29 +01001600 return $str;
1601}
1602
391862e3
JN
Jakub Narębski2006-11-25 09:43:59 +01001603# quote control characters and escape filename to HTML
1604sub esc_path {
1605 my $str = shift;
1606 my %opts = @_;
1607
1df48766
JN
Jakub Narębski2010-02-07 21:52:25 +01001608 return undef unless defined $str;
1609
00f429af Martin Koegler2007-06-03 17:42:44 +02001610 $str = to_utf8($str);
c390ae97 Li Yang2007-03-06 11:58:56 +08001611 $str = $cgi->escapeHTML($str);
391862e3
JN
Jakub Narębski2006-11-25 09:43:59 +01001612 if ($opts{'-nbsp'}) {
1613 $str =~ s/ /&nbsp;/g;
1614 }
1615 $str =~ s|([[:cntrl:]])|quot_cec($1)|eg;
1616 return $str;
1617}
1618
0866786b
JN
Jakub Narębski2011-09-16 14:41:57 +02001619# Sanitize for use in XHTML + application/xml+xhtm (valid XML 1.0)
1620sub sanitize {
1621 my $str = shift;
1622
1623 return undef unless defined $str;
1624
1625 $str = to_utf8($str);
0e901d24 Orgad Shaneh2012-12-30 13:52:53 +02001626 $str =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
0866786b
JN
Jakub Narębski2011-09-16 14:41:57 +02001627 return $str;
1628}
1629
391862e3 Jakub Narębski2006-11-25 09:43:59 +01001630# Make control characters "printable", using character escape codes (CEC)
1d3bc0cc
JN
Jakub Narębski2006-11-08 11:50:07 +01001631sub quot_cec {
1632 my $cntrl = shift;
c84c483f Jakub Narębski2008-02-17 18:48:13 +01001633 my %opts = @_;
1d3bc0cc Jakub Narębski2006-11-08 11:50:07 +01001634 my %es = ( # character escape codes, aka escape sequences
c84c483f
JN
Jakub Narębski2008-02-17 18:48:13 +01001635 "\t" => '\t', # tab (HT)
1636 "\n" => '\n', # line feed (LF)
1637 "\r" => '\r', # carrige return (CR)
1638 "\f" => '\f', # form feed (FF)
1639 "\b" => '\b', # backspace (BS)
1640 "\a" => '\a', # alarm (bell) (BEL)
1641 "\e" => '\e', # escape (ESC)
1642 "\013" => '\v', # vertical tab (VT)
1643 "\000" => '\0', # nul character (NUL)
1644 );
1d3bc0cc
JN
Jakub Narębski2006-11-08 11:50:07 +01001645 my $chr = ( (exists $es{$cntrl})
1646 ? $es{$cntrl}
25dfd171 Petr Baudis2008-10-01 22:11:54 +02001647 : sprintf('\%2x', ord($cntrl)) );
c84c483f
JN
Jakub Narębski2008-02-17 18:48:13 +01001648 if ($opts{-nohtml}) {
1649 return $chr;
1650 } else {
1651 return "<span class=\"cntrl\">$chr</span>";
1652 }
1d3bc0cc
JN
Jakub Narębski2006-11-08 11:50:07 +01001653}
1654
391862e3
JN
Jakub Narębski2006-11-25 09:43:59 +01001655# Alternatively use unicode control pictures codepoints,
1656# Unicode "printable representation" (PR)
1d3bc0cc
JN
Jakub Narębski2006-11-08 11:50:07 +01001657sub quot_upr {
1658 my $cntrl = shift;
c84c483f
JN
Jakub Narębski2008-02-17 18:48:13 +01001659 my %opts = @_;
1660
1d3bc0cc Jakub Narębski2006-11-08 11:50:07 +01001661 my $chr = sprintf('&#%04d;', 0x2400+ord($cntrl));
c84c483f
JN
Jakub Narębski2008-02-17 18:48:13 +01001662 if ($opts{-nohtml}) {
1663 return $chr;
1664 } else {
1665 return "<span class=\"cntrl\">$chr</span>";
1666 }
1d3bc0cc
JN
Jakub Narębski2006-11-08 11:50:07 +01001667}
1668
232ff553
KS
Kay Sievers2005-11-24 16:56:55 +01001669# git may return quoted and escaped filenames
1670sub unquote {
1671 my $str = shift;
403d0906
JN
Jakub Narębski2006-11-08 11:48:56 +01001672
1673 sub unq {
1674 my $seq = shift;
1675 my %es = ( # character escape codes, aka escape sequences
1676 't' => "\t", # tab (HT, TAB)
1677 'n' => "\n", # newline (NL)
1678 'r' => "\r", # return (CR)
1679 'f' => "\f", # form feed (FF)
1680 'b' => "\b", # backspace (BS)
1681 'a' => "\a", # alarm (bell) (BEL)
1682 'e' => "\e", # escape (ESC)
1683 'v' => "\013", # vertical tab (VT)
1684 );
1685
1686 if ($seq =~ m/^[0-7]{1,3}$/) {
1687 # octal char sequence
1688 return chr(oct($seq));
1689 } elsif (exists $es{$seq}) {
1690 # C escape sequence, aka character escape code
c84c483f Jakub Narębski2008-02-17 18:48:13 +01001691 return $es{$seq};
403d0906
JN
Jakub Narębski2006-11-08 11:48:56 +01001692 }
1693 # quoted ordinary character
1694 return $seq;
1695 }
1696
232ff553 Kay Sievers2005-11-24 16:56:55 +01001697 if ($str =~ m/^"(.*)"$/) {
403d0906 Jakub Narębski2006-11-08 11:48:56 +01001698 # needs unquoting
232ff553 Kay Sievers2005-11-24 16:56:55 +01001699 $str = $1;
403d0906 Jakub Narębski2006-11-08 11:48:56 +01001700 $str =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
232ff553
KS
Kay Sievers2005-11-24 16:56:55 +01001701 }
1702 return $str;
1703}
1704
f16db173
JN
Jakub Narębski2006-08-06 02:08:31 +02001705# escape tabs (convert tabs to spaces)
1706sub untabify {
1707 my $line = shift;
1708
1709 while ((my $pos = index($line, "\t")) != -1) {
1710 if (my $count = (8 - ($pos % 8))) {
1711 my $spaces = ' ' x $count;
1712 $line =~ s/\t/$spaces/;
1713 }
1714 }
1715
1716 return $line;
1717}
1718
32f4aacc
ML
Matthias Lederhofer2006-09-17 00:31:01 +02001719sub project_in_list {
1720 my $project = shift;
1721 my @list = git_get_projects_list();
1722 return @list && scalar(grep { $_->{'path'} eq $project } @list);
1723}
1724
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001725## ----------------------------------------------------------------------
1726## HTML aware string manipulation
1727
b8d97d07
JN
Jakub Narębski2008-02-25 21:07:57 +01001728# Try to chop given string on a word boundary between position
1729# $len and $len+$add_len. If there is no word boundary there,
1730# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
1731# (marking chopped part) would be longer than given string.
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001732sub chop_str {
1733 my $str = shift;
1734 my $len = shift;
1735 my $add_len = shift || 10;
b8d97d07 Jakub Narębski2008-02-25 21:07:57 +01001736 my $where = shift || 'right'; # 'left' | 'center' | 'right'
717b8311 Jakub Narębski2006-07-31 21:22:15 +02001737
dee2775a
AW
Anders Waldenborg2008-05-21 13:44:43 +02001738 # Make sure perl knows it is utf8 encoded so we don't
1739 # cut in the middle of a utf8 multibyte char.
1740 $str = to_utf8($str);
1741
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001742 # allow only $len chars, but don't cut a word if it would fit in $add_len
1743 # if it doesn't fit, cut it if it's still longer than the dots we would add
b8d97d07
JN
Jakub Narębski2008-02-25 21:07:57 +01001744 # remove chopped character entities entirely
1745
1746 # when chopping in the middle, distribute $len into left and right part
1747 # return early if chopping wouldn't make string shorter
1748 if ($where eq 'center') {
1749 return $str if ($len + 5 >= length($str)); # filler is length 5
1750 $len = int($len/2);
1751 } else {
1752 return $str if ($len + 4 >= length($str)); # filler is length 4
1753 }
1754
1755 # regexps: ending and beginning with word part up to $add_len
1756 my $endre = qr/.{$len}\w{0,$add_len}/;
1757 my $begre = qr/\w{0,$add_len}.{$len}/;
1758
1759 if ($where eq 'left') {
1760 $str =~ m/^(.*?)($begre)$/;
1761 my ($lead, $body) = ($1, $2);
1762 if (length($lead) > 4) {
b8d97d07
JN
Jakub Narębski2008-02-25 21:07:57 +01001763 $lead = " ...";
1764 }
1765 return "$lead$body";
1766
1767 } elsif ($where eq 'center') {
1768 $str =~ m/^($endre)(.*)$/;
1769 my ($left, $str) = ($1, $2);
1770 $str =~ m/^(.*?)($begre)$/;
1771 my ($mid, $right) = ($1, $2);
1772 if (length($mid) > 5) {
b8d97d07
JN
Jakub Narębski2008-02-25 21:07:57 +01001773 $mid = " ... ";
1774 }
1775 return "$left$mid$right";
1776
1777 } else {
1778 $str =~ m/^($endre)(.*)$/;
1779 my $body = $1;
1780 my $tail = $2;
1781 if (length($tail) > 4) {
b8d97d07
JN
Jakub Narębski2008-02-25 21:07:57 +01001782 $tail = "... ";
1783 }
1784 return "$body$tail";
717b8311 Jakub Narębski2006-07-31 21:22:15 +02001785 }
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001786}
1787
ce58ec91
DS
David Symonds2007-10-23 11:31:22 +10001788# takes the same arguments as chop_str, but also wraps a <span> around the
1789# result with a title attribute if it does get chopped. Additionally, the
1790# string is HTML-escaped.
1791sub chop_and_escape_str {
b8d97d07 Jakub Narębski2008-02-25 21:07:57 +01001792 my ($str) = @_;
ce58ec91 David Symonds2007-10-23 11:31:22 +10001793
b8d97d07 Jakub Narębski2008-02-25 21:07:57 +01001794 my $chopped = chop_str(@_);
168c1e01 Jürgen Kreileder2011-12-17 10:22:21 +01001795 $str = to_utf8($str);
ce58ec91
DS
David Symonds2007-10-23 11:31:22 +10001796 if ($chopped eq $str) {
1797 return esc_html($chopped);
1798 } else {
14afe774 Jakub Narębski2009-05-22 17:35:46 +02001799 $str =~ s/[[:cntrl:]]/?/g;
850b90a5 Jakub Narębski2008-02-16 23:07:46 +01001800 return $cgi->span({-title=>$str}, esc_html($chopped));
ce58ec91
DS
David Symonds2007-10-23 11:31:22 +10001801 }
1802}
1803
337da8d2
JN
Jakub Narębski2012-02-27 02:55:19 +01001804# Highlight selected fragments of string, using given CSS class,
1805# and escape HTML. It is assumed that fragments do not overlap.
1806# Regions are passed as list of pairs (array references).
1807#
1808# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
1809# '<span class="mark">foo</span>bar'
1810sub esc_html_hl_regions {
1811 my ($str, $css_class, @sel) = @_;
9768a9d8
JN
Jakub Narębski2012-04-11 23:18:39 +02001812 my %opts = grep { ref($_) ne 'ARRAY' } @sel;
1813 @sel = grep { ref($_) eq 'ARRAY' } @sel;
1814 return esc_html($str, %opts) unless @sel;
337da8d2
JN
Jakub Narębski2012-02-27 02:55:19 +01001815
1816 my $out = '';
1817 my $pos = 0;
1818
1819 for my $s (@sel) {
ce61fb96 Michał Kiedrowicz2012-04-11 23:18:37 +02001820 my ($begin, $end) = @$s;
337da8d2 Jakub Narębski2012-02-27 02:55:19 +01001821
cbbea3df
MK
Michał Kiedrowicz2012-04-11 23:18:38 +02001822 # Don't create empty <span> elements.
1823 next if $end <= $begin;
1824
9768a9d8
JN
Jakub Narębski2012-04-11 23:18:39 +02001825 my $escaped = esc_html(substr($str, $begin, $end - $begin),
1826 %opts);
ce61fb96 Michał Kiedrowicz2012-04-11 23:18:37 +02001827
9768a9d8 Jakub Narębski2012-04-11 23:18:39 +02001828 $out .= esc_html(substr($str, $pos, $begin - $pos), %opts)
ce61fb96
MK
Michał Kiedrowicz2012-04-11 23:18:37 +02001829 if ($begin - $pos > 0);
1830 $out .= $cgi->span({-class => $css_class}, $escaped);
1831
1832 $pos = $end;
337da8d2 Jakub Narębski2012-02-27 02:55:19 +01001833 }
9768a9d8 Jakub Narębski2012-04-11 23:18:39 +02001834 $out .= esc_html(substr($str, $pos), %opts)
337da8d2
JN
Jakub Narębski2012-02-27 02:55:19 +01001835 if ($pos < length($str));
1836
1837 return $out;
1838}
1839
e607b79f
JN
Jakub Narębski2012-02-27 02:55:22 +01001840# return positions of beginning and end of each match
1841sub matchpos_list {
337da8d2 Jakub Narębski2012-02-27 02:55:19 +01001842 my ($str, $regexp) = @_;
e607b79f Jakub Narębski2012-02-27 02:55:22 +01001843 return unless (defined $str && defined $regexp);
337da8d2
JN
Jakub Narębski2012-02-27 02:55:19 +01001844
1845 my @matches;
1846 while ($str =~ /$regexp/g) {
1847 push @matches, [$-[0], $+[0]];
1848 }
e607b79f
JN
Jakub Narębski2012-02-27 02:55:22 +01001849 return @matches;
1850}
1851
1852# highlight match (if any), and escape HTML
1853sub esc_html_match_hl {
1854 my ($str, $regexp) = @_;
1855 return esc_html($str) unless defined $regexp;
1856
1857 my @matches = matchpos_list($str, $regexp);
337da8d2
JN
Jakub Narębski2012-02-27 02:55:19 +01001858 return esc_html($str) unless @matches;
1859
1860 return esc_html_hl_regions($str, 'match', @matches);
1861}
1862
e607b79f
JN
Jakub Narębski2012-02-27 02:55:22 +01001863
1864# highlight match (if any) of shortened string, and escape HTML
1865sub esc_html_match_hl_chopped {
1866 my ($str, $chopped, $regexp) = @_;
1867 return esc_html_match_hl($str, $regexp) unless defined $chopped;
1868
1869 my @matches = matchpos_list($str, $regexp);
1870 return esc_html($chopped) unless @matches;
1871
1872 # filter matches so that we mark chopped string
1873 my $tail = "... "; # see chop_str
1874 unless ($chopped =~ s/\Q$tail\E$//) {
1875 $tail = '';
1876 }
1877 my $chop_len = length($chopped);
1878 my $tail_len = length($tail);
1879 my @filtered;
1880
1881 for my $m (@matches) {
1882 if ($m->[0] > $chop_len) {
1883 push @filtered, [ $chop_len, $chop_len + $tail_len ] if ($tail_len > 0);
1884 last;
1885 } elsif ($m->[1] > $chop_len) {
1886 push @filtered, [ $m->[0], $chop_len + $tail_len ];
1887 last;
1888 }
1889 push @filtered, $m;
1890 }
1891
1892 return esc_html_hl_regions($chopped . $tail, 'match', @filtered);
1893}
1894
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001895## ----------------------------------------------------------------------
1896## functions returning short strings
1897
1f1ab5f0
JN
Jakub Narębski2006-06-20 14:58:12 +00001898# CSS class for given age value (in seconds)
1899sub age_class {
1900 my $age = shift;
1901
785cdea9
JN
Jakub Narębski2007-05-13 12:39:22 +02001902 if (!defined $age) {
1903 return "noage";
1904 } elsif ($age < 60*60*2) {
1f1ab5f0
JN
Jakub Narębski2006-06-20 14:58:12 +00001905 return "age0";
1906 } elsif ($age < 60*60*24*2) {
1907 return "age1";
1908 } else {
1909 return "age2";
1910 }
1911}
1912
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001913# convert age in seconds to "nn units ago" string
1914sub age_string {
1915 my $age = shift;
1916 my $age_str;
a59d4afd Kay Sievers2005-08-07 20:15:44 +02001917
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001918 if ($age > 60*60*24*365*2) {
1919 $age_str = (int $age/60/60/24/365);
1920 $age_str .= " years ago";
1921 } elsif ($age > 60*60*24*(365/12)*2) {
1922 $age_str = int $age/60/60/24/(365/12);
1923 $age_str .= " months ago";
1924 } elsif ($age > 60*60*24*7*2) {
1925 $age_str = int $age/60/60/24/7;
1926 $age_str .= " weeks ago";
1927 } elsif ($age > 60*60*24*2) {
1928 $age_str = int $age/60/60/24;
1929 $age_str .= " days ago";
1930 } elsif ($age > 60*60*2) {
1931 $age_str = int $age/60/60;
1932 $age_str .= " hours ago";
1933 } elsif ($age > 60*2) {
1934 $age_str = int $age/60;
1935 $age_str .= " min ago";
1936 } elsif ($age > 2) {
1937 $age_str = int $age;
1938 $age_str .= " sec ago";
f6801d66 Alp Toker2006-07-11 11:19:34 +01001939 } else {
717b8311 Jakub Narębski2006-07-31 21:22:15 +02001940 $age_str .= " right now";
4c02e3c5 Kay Sievers2005-08-07 19:52:52 +02001941 }
717b8311 Jakub Narębski2006-07-31 21:22:15 +02001942 return $age_str;
161332a5
KS
Kay Sievers2005-08-07 19:49:46 +02001943}
1944
01ac1e38
JN
Jakub Narębski2007-07-28 16:27:31 +02001945use constant {
1946 S_IFINVALID => 0030000,
1947 S_IFGITLINK => 0160000,
1948};
1949
1950# submodule/subproject, a commit object reference
74fd8728 Jakub Narębski2009-05-07 19:11:29 +02001951sub S_ISGITLINK {
01ac1e38
JN
Jakub Narębski2007-07-28 16:27:31 +02001952 my $mode = shift;
1953
1954 return (($mode & S_IFMT) == S_IFGITLINK)
1955}
1956
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001957# convert file mode in octal to symbolic file mode string
1958sub mode_str {
1959 my $mode = oct shift;
1960
01ac1e38
JN
Jakub Narębski2007-07-28 16:27:31 +02001961 if (S_ISGITLINK($mode)) {
1962 return 'm---------';
1963 } elsif (S_ISDIR($mode & S_IFMT)) {
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001964 return 'drwxr-xr-x';
1965 } elsif (S_ISLNK($mode)) {
1966 return 'lrwxrwxrwx';
1967 } elsif (S_ISREG($mode)) {
1968 # git cares only about the executable bit
1969 if ($mode & S_IXUSR) {
1970 return '-rwxr-xr-x';
1971 } else {
1972 return '-rw-r--r--';
1973 };
c994d620 Kay Sievers2005-08-07 20:27:18 +02001974 } else {
717b8311 Jakub Narębski2006-07-31 21:22:15 +02001975 return '----------';
ff7669a5 Kay Sievers2005-08-07 20:13:02 +02001976 }
161332a5
KS
Kay Sievers2005-08-07 19:49:46 +02001977}
1978
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001979# convert file mode in octal to file type string
1980sub file_type {
7c5e2ebb
JN
Jakub Narębski2006-08-25 21:13:34 +02001981 my $mode = shift;
1982
1983 if ($mode !~ m/^[0-7]+$/) {
1984 return $mode;
1985 } else {
1986 $mode = oct $mode;
1987 }
664f4cc5 Kay Sievers2005-08-07 20:17:19 +02001988
01ac1e38
JN
Jakub Narębski2007-07-28 16:27:31 +02001989 if (S_ISGITLINK($mode)) {
1990 return "submodule";
1991 } elsif (S_ISDIR($mode & S_IFMT)) {
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02001992 return "directory";
1993 } elsif (S_ISLNK($mode)) {
1994 return "symlink";
1995 } elsif (S_ISREG($mode)) {
1996 return "file";
1997 } else {
1998 return "unknown";
1999 }
a59d4afd
KS
Kay Sievers2005-08-07 20:15:44 +02002000}
2001
744d0ac3
JN
Jakub Narębski2006-11-08 17:59:41 +01002002# convert file mode in octal to file type description string
2003sub file_type_long {
2004 my $mode = shift;
2005
2006 if ($mode !~ m/^[0-7]+$/) {
2007 return $mode;
2008 } else {
2009 $mode = oct $mode;
2010 }
2011
01ac1e38
JN
Jakub Narębski2007-07-28 16:27:31 +02002012 if (S_ISGITLINK($mode)) {
2013 return "submodule";
2014 } elsif (S_ISDIR($mode & S_IFMT)) {
744d0ac3
JN
Jakub Narębski2006-11-08 17:59:41 +01002015 return "directory";
2016 } elsif (S_ISLNK($mode)) {
2017 return "symlink";
2018 } elsif (S_ISREG($mode)) {
2019 if ($mode & S_IXUSR) {
2020 return "executable";
2021 } else {
2022 return "file";
2023 };
2024 } else {
2025 return "unknown";
2026 }
2027}
2028
2029
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002030## ----------------------------------------------------------------------
2031## functions returning short HTML fragments, or transforming HTML fragments
3dff5379 Pavel Roskin2007-02-03 23:49:16 -05002032## which don't belong to other sections
b18f9bf4 Jakub Narębski2006-07-30 14:59:57 +02002033
225932ed Junio C Hamano2006-11-09 00:57:13 -08002034# format line of commit message.
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002035sub format_log_line_html {
2036 my $line = shift;
b18f9bf4 Jakub Narębski2006-07-30 14:59:57 +02002037
225932ed Junio C Hamano2006-11-09 00:57:13 -08002038 $line = esc_html($line, -nbsp=>1);
7d233dea
MC
Marcel M. Cary2009-02-17 19:00:43 -08002039 $line =~ s{\b([0-9a-fA-F]{8,40})\b}{
2040 $cgi->a({-href => href(action=>"object", hash=>$1),
2041 -class => "text"}, $1);
2042 }eg;
2043
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002044 return $line;
b18f9bf4
JN
Jakub Narębski2006-07-30 14:59:57 +02002045}
2046
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002047# format marker of refs pointing to given object
4afbaeff
GB
Giuseppe Bilotta2008-09-02 21:47:05 +02002048
2049# the destination action is chosen based on object type and current context:
2050# - for annotated tags, we choose the tag view unless it's the current view
2051# already, in which case we go to shortlog view
2052# - for other refs, we keep the current view if we're in history, shortlog or
2053# log view, and select shortlog otherwise
847e01fb Jakub Narębski2006-08-14 02:05:47 +02002054sub format_ref_marker {
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002055 my ($refs, $id) = @_;
d294e1ca Jakub Narębski2006-08-14 02:14:20 +02002056 my $markers = '';
27fb8c40 Jakub Narębski2006-07-30 20:32:01 +02002057
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002058 if (defined $refs->{$id}) {
d294e1ca Jakub Narębski2006-08-14 02:14:20 +02002059 foreach my $ref (@{$refs->{$id}}) {
4afbaeff
GB
Giuseppe Bilotta2008-09-02 21:47:05 +02002060 # this code exploits the fact that non-lightweight tags are the
2061 # only indirect objects, and that they are the only objects for which
2062 # we want to use tag instead of shortlog as action
d294e1ca Jakub Narębski2006-08-14 02:14:20 +02002063 my ($type, $name) = qw();
4afbaeff Giuseppe Bilotta2008-09-02 21:47:05 +02002064 my $indirect = ($ref =~ s/\^\{\}$//);
d294e1ca
JN
Jakub Narębski2006-08-14 02:14:20 +02002065 # e.g. tags/v2.6.11 or heads/next
2066 if ($ref =~ m!^(.*?)s?/(.*)$!) {
2067 $type = $1;
2068 $name = $2;
2069 } else {
2070 $type = "ref";
2071 $name = $ref;
2072 }
2073
4afbaeff
GB
Giuseppe Bilotta2008-09-02 21:47:05 +02002074 my $class = $type;
2075 $class .= " indirect" if $indirect;
2076
2077 my $dest_action = "shortlog";
2078
2079 if ($indirect) {
2080 $dest_action = "tag" unless $action eq "tag";
2081 } elsif ($action =~ /^(history|(short)?log)$/) {
2082 $dest_action = $action;
2083 }
2084
2085 my $dest = "";
2086 $dest .= "refs/" unless $ref =~ m!^refs/!;
2087 $dest .= $ref;
2088
2089 my $link = $cgi->a({
2090 -href => href(
2091 action=>$dest_action,
2092 hash=>$dest
2093 )}, $name);
2094
3017ed62 Jakub Narębski2010-12-15 00:34:01 +01002095 $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
4afbaeff Giuseppe Bilotta2008-09-02 21:47:05 +02002096 $link . "</span>";
d294e1ca
JN
Jakub Narębski2006-08-14 02:14:20 +02002097 }
2098 }
2099
2100 if ($markers) {
2101 return ' <span class="refs">'. $markers . '</span>';
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002102 } else {
2103 return "";
2104 }
27fb8c40
JN
Jakub Narębski2006-07-30 20:32:01 +02002105}
2106
17d07443
JN
Jakub Narębski2006-08-14 02:08:27 +02002107# format, perhaps shortened and with markers, title line
2108sub format_subject_html {
1c2a4f5a Martin Waitz2006-08-16 00:24:30 +02002109 my ($long, $short, $href, $extra) = @_;
17d07443
JN
Jakub Narębski2006-08-14 02:08:27 +02002110 $extra = '' unless defined($extra);
2111
2112 if (length($short) < length($long)) {
14afe774 Jakub Narębski2009-05-22 17:35:46 +02002113 $long =~ s/[[:cntrl:]]/?/g;
7c278014 Jakub Narębski2006-08-22 12:02:48 +02002114 return $cgi->a({-href => $href, -class => "list subject",
00f429af Martin Koegler2007-06-03 17:42:44 +02002115 -title => to_utf8($long)},
01b89f0c Giuseppe Bilotta2009-08-23 10:28:09 +02002116 esc_html($short)) . $extra;
17d07443 Jakub Narębski2006-08-14 02:08:27 +02002117 } else {
7c278014 Jakub Narębski2006-08-22 12:02:48 +02002118 return $cgi->a({-href => $href, -class => "list subject"},
01b89f0c Giuseppe Bilotta2009-08-23 10:28:09 +02002119 esc_html($long)) . $extra;
17d07443
JN
Jakub Narębski2006-08-14 02:08:27 +02002120 }
2121}
2122
5a371b7b
GB
Giuseppe Bilotta2009-06-30 00:00:52 +02002123# Rather than recomputing the url for an email multiple times, we cache it
2124# after the first hit. This gives a visible benefit in views where the avatar
2125# for the same email is used repeatedly (e.g. shortlog).
2126# The cache is shared by all avatar engines (currently gravatar only), which
2127# are free to use it as preferred. Since only one avatar engine is used for any
2128# given page, there's no risk for cache conflicts.
2129our %avatar_cache = ();
2130
679a1a1d
GB
Giuseppe Bilotta2009-06-30 00:00:53 +02002131# Compute the picon url for a given email, by using the picon search service over at
2132# http://www.cs.indiana.edu/picons/search.html
2133sub picon_url {
2134 my $email = lc shift;
2135 if (!$avatar_cache{$email}) {
2136 my ($user, $domain) = split('@', $email);
2137 $avatar_cache{$email} =
57485581 Andrej E Baranov2013-01-29 00:41:32 +01002138 "//www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
679a1a1d
GB
Giuseppe Bilotta2009-06-30 00:00:53 +02002139 "$domain/$user/" .
2140 "users+domains+unknown/up/single";
2141 }
2142 return $avatar_cache{$email};
2143}
2144
5a371b7b
GB
Giuseppe Bilotta2009-06-30 00:00:52 +02002145# Compute the gravatar url for a given email, if it's not in the cache already.
2146# Gravatar stores only the part of the URL before the size, since that's the
2147# one computationally more expensive. This also allows reuse of the cache for
2148# different sizes (for this particular engine).
2149sub gravatar_url {
2150 my $email = lc shift;
2151 my $size = shift;
2152 $avatar_cache{$email} ||=
57485581 Andrej E Baranov2013-01-29 00:41:32 +01002153 "//www.gravatar.com/avatar/" .
5a371b7b
GB
Giuseppe Bilotta2009-06-30 00:00:52 +02002154 Digest::MD5::md5_hex($email) . "?s=";
2155 return $avatar_cache{$email} . $size;
2156}
2157
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +02002158# Insert an avatar for the given $email at the given $size if the feature
2159# is enabled.
2160sub git_get_avatar {
2161 my ($email, %opts) = @_;
2162 my $pre_white = ($opts{-pad_before} ? "&nbsp;" : "");
2163 my $post_white = ($opts{-pad_after} ? "&nbsp;" : "");
2164 $opts{-size} ||= 'default';
2165 my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};
2166 my $url = "";
2167 if ($git_avatar eq 'gravatar') {
5a371b7b Giuseppe Bilotta2009-06-30 00:00:52 +02002168 $url = gravatar_url($email, $size);
679a1a1d
GB
Giuseppe Bilotta2009-06-30 00:00:53 +02002169 } elsif ($git_avatar eq 'picon') {
2170 $url = picon_url($email);
e9fdd74e Giuseppe Bilotta2009-06-30 00:00:51 +02002171 }
679a1a1d Giuseppe Bilotta2009-06-30 00:00:53 +02002172 # Other providers can be added by extending the if chain, defining $url
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +02002173 # as needed. If no variant puts something in $url, we assume avatars
2174 # are completely disabled/unavailable.
2175 if ($url) {
2176 return $pre_white .
2177 "<img width=\"$size\" " .
2178 "class=\"avatar\" " .
3017ed62 Jakub Narębski2010-12-15 00:34:01 +01002179 "src=\"".esc_url($url)."\" " .
7d25ef41 Giuseppe Bilotta2009-06-30 00:00:54 +02002180 "alt=\"\" " .
e9fdd74e
GB
Giuseppe Bilotta2009-06-30 00:00:51 +02002181 "/>" . $post_white;
2182 } else {
2183 return "";
2184 }
2185}
2186
e133d65c
SB
Stephen Boyd2009-10-15 21:14:59 -07002187sub format_search_author {
2188 my ($author, $searchtype, $displaytext) = @_;
2189 my $have_search = gitweb_check_feature('search');
2190
2191 if ($have_search) {
2192 my $performed = "";
2193 if ($searchtype eq 'author') {
2194 $performed = "authored";
2195 } elsif ($searchtype eq 'committer') {
2196 $performed = "committed";
2197 }
2198
2199 return $cgi->a({-href => href(action=>"search", hash=>$hash,
2200 searchtext=>$author,
2201 searchtype=>$searchtype), class=>"list",
2202 title=>"Search for commits $performed by $author"},
2203 $displaytext);
2204
2205 } else {
2206 return $displaytext;
2207 }
2208}
2209
1c49a4e1
GB
Giuseppe Bilotta2009-06-30 00:00:48 +02002210# format the author name of the given commit with the given tag
2211# the author name is chopped and escaped according to the other
2212# optional parameters (see chop_str).
2213sub format_author_html {
2214 my $tag = shift;
2215 my $co = shift;
2216 my $author = chop_and_escape_str($co->{'author_name'}, @_);
e9fdd74e Giuseppe Bilotta2009-06-30 00:00:51 +02002217 return "<$tag class=\"author\">" .
e133d65c
SB
Stephen Boyd2009-10-15 21:14:59 -07002218 format_search_author($co->{'author_name'}, "author",
2219 git_get_avatar($co->{'author_email'}, -pad_after => 1) .
2220 $author) .
2221 "</$tag>";
1c49a4e1
GB
Giuseppe Bilotta2009-06-30 00:00:48 +02002222}
2223
90921740
JN
Jakub Narębski2007-06-08 13:27:42 +02002224# format git diff header line, i.e. "diff --(git|combined|cc) ..."
2225sub format_git_diff_header_line {
2226 my $line = shift;
2227 my $diffinfo = shift;
2228 my ($from, $to) = @_;
2229
2230 if ($diffinfo->{'nparents'}) {
2231 # combined diff
2232 $line =~ s!^(diff (.*?) )"?.*$!$1!;
2233 if ($to->{'href'}) {
2234 $line .= $cgi->a({-href => $to->{'href'}, -class => "path"},
2235 esc_path($to->{'file'}));
2236 } else { # file was deleted (no href)
2237 $line .= esc_path($to->{'file'});
2238 }
2239 } else {
2240 # "ordinary" diff
2241 $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
2242 if ($from->{'href'}) {
2243 $line .= $cgi->a({-href => $from->{'href'}, -class => "path"},
2244 'a/' . esc_path($from->{'file'}));
2245 } else { # file was added (no href)
2246 $line .= 'a/' . esc_path($from->{'file'});
2247 }
2248 $line .= ' ';
2249 if ($to->{'href'}) {
2250 $line .= $cgi->a({-href => $to->{'href'}, -class => "path"},
2251 'b/' . esc_path($to->{'file'}));
2252 } else { # file was deleted
2253 $line .= 'b/' . esc_path($to->{'file'});
2254 }
2255 }
2256
2257 return "<div class=\"diff header\">$line</div>\n";
2258}
2259
2260# format extended diff header line, before patch itself
2261sub format_extended_diff_header_line {
2262 my $line = shift;
2263 my $diffinfo = shift;
2264 my ($from, $to) = @_;
2265
2266 # match <path>
2267 if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
2268 $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
2269 esc_path($from->{'file'}));
2270 }
2271 if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
2272 $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
2273 esc_path($to->{'file'}));
2274 }
2275 # match single <mode>
2276 if ($line =~ m/\s(\d{6})$/) {
2277 $line .= '<span class="info"> (' .
2278 file_type_long($1) .
2279 ')</span>';
2280 }
2281 # match <hash>
2282 if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
2283 # can match only for combined diff
2284 $line = 'index ';
2285 for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
2286 if ($from->{'href'}[$i]) {
2287 $line .= $cgi->a({-href=>$from->{'href'}[$i],
2288 -class=>"hash"},
2289 substr($diffinfo->{'from_id'}[$i],0,7));
2290 } else {
2291 $line .= '0' x 7;
2292 }
2293 # separator
2294 $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
2295 }
2296 $line .= '..';
2297 if ($to->{'href'}) {
2298 $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
2299 substr($diffinfo->{'to_id'},0,7));
2300 } else {
2301 $line .= '0' x 7;
2302 }
2303
2304 } elsif ($line =~ m/^index [0-9a-fA-F]{40}..[0-9a-fA-F]{40}/) {
2305 # can match only for ordinary diff
2306 my ($from_link, $to_link);
2307 if ($from->{'href'}) {
2308 $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
2309 substr($diffinfo->{'from_id'},0,7));
2310 } else {
2311 $from_link = '0' x 7;
2312 }
2313 if ($to->{'href'}) {
2314 $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
2315 substr($diffinfo->{'to_id'},0,7));
2316 } else {
2317 $to_link = '0' x 7;
2318 }
2319 my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
2320 $line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
2321 }
2322
2323 return $line . "<br/>\n";
2324}
2325
2326# format from-file/to-file diff header
2327sub format_diff_from_to_header {
91af4ce4 Jakub Narębski2007-06-08 13:32:44 +02002328 my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
90921740
JN
Jakub Narębski2007-06-08 13:27:42 +02002329 my $line;
2330 my $result = '';
2331
2332 $line = $from_line;
2333 #assert($line =~ m/^---/) if DEBUG;
deaa01a9
JN
Jakub Narębski2007-06-08 13:29:49 +02002334 # no extra formatting for "^--- /dev/null"
2335 if (! $diffinfo->{'nparents'}) {
2336 # ordinary (single parent) diff
2337 if ($line =~ m!^--- "?a/!) {
2338 if ($from->{'href'}) {
2339 $line = '--- a/' .
2340 $cgi->a({-href=>$from->{'href'}, -class=>"path"},
2341 esc_path($from->{'file'}));
2342 } else {
2343 $line = '--- a/' .
2344 esc_path($from->{'file'});
2345 }
2346 }
2347 $result .= qq!<div class="diff from_file">$line</div>\n!;
2348
2349 } else {
2350 # combined diff (merge commit)
2351 for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
2352 if ($from->{'href'}[$i]) {
2353 $line = '--- ' .
91af4ce4
JN
Jakub Narębski2007-06-08 13:32:44 +02002354 $cgi->a({-href=>href(action=>"blobdiff",
2355 hash_parent=>$diffinfo->{'from_id'}[$i],
2356 hash_parent_base=>$parents[$i],
2357 file_parent=>$from->{'file'}[$i],
2358 hash=>$diffinfo->{'to_id'},
2359 hash_base=>$hash,
2360 file_name=>$to->{'file'}),
2361 -class=>"path",
2362 -title=>"diff" . ($i+1)},
2363 $i+1) .
2364 '/' .
deaa01a9
JN
Jakub Narębski2007-06-08 13:29:49 +02002365 $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
2366 esc_path($from->{'file'}[$i]));
2367 } else {
2368 $line = '--- /dev/null';
2369 }
2370 $result .= qq!<div class="diff from_file">$line</div>\n!;
90921740
JN
Jakub Narębski2007-06-08 13:27:42 +02002371 }
2372 }
90921740
JN
Jakub Narębski2007-06-08 13:27:42 +02002373
2374 $line = $to_line;
2375 #assert($line =~ m/^\+\+\+/) if DEBUG;
2376 # no extra formatting for "^+++ /dev/null"
2377 if ($line =~ m!^\+\+\+ "?b/!) {
2378 if ($to->{'href'}) {
2379 $line = '+++ b/' .
2380 $cgi->a({-href=>$to->{'href'}, -class=>"path"},
2381 esc_path($to->{'file'}));
2382 } else {
2383 $line = '+++ b/' .
2384 esc_path($to->{'file'});
2385 }
2386 }
2387 $result .= qq!<div class="diff to_file">$line</div>\n!;
2388
2389 return $result;
2390}
2391
cd030c3a
JN
Jakub Narębski2007-06-08 13:33:28 +02002392# create note for patch simplified by combined diff
2393sub format_diff_cc_simplified {
2394 my ($diffinfo, @parents) = @_;
2395 my $result = '';
2396
2397 $result .= "<div class=\"diff header\">" .
2398 "diff --cc ";
2399 if (!is_deleted($diffinfo)) {
2400 $result .= $cgi->a({-href => href(action=>"blob",
2401 hash_base=>$hash,
2402 hash=>$diffinfo->{'to_id'},
2403 file_name=>$diffinfo->{'to_file'}),
2404 -class => "path"},
2405 esc_path($diffinfo->{'to_file'}));
2406 } else {
2407 $result .= esc_path($diffinfo->{'to_file'});
2408 }
2409 $result .= "</div>\n" . # class="diff header"
2410 "<div class=\"diff nodifferences\">" .
2411 "Simple merge" .
2412 "</div>\n"; # class="diff nodifferences"
2413
2414 return $result;
2415}
2416
20a864cd
JN
Jakub Narębski2011-10-31 00:36:20 +01002417sub diff_line_class {
2418 my ($line, $from, $to) = @_;
2419
2420 # ordinary diff
2421 my $num_sign = 1;
2422 # combined diff
2423 if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
2424 $num_sign = scalar @{$from->{'href'}};
2425 }
2426
2427 my @diff_line_classifier = (
2428 { regexp => qr/^\@\@{$num_sign} /, class => "chunk_header"},
2429 { regexp => qr/^\\/, class => "incomplete" },
2430 { regexp => qr/^ {$num_sign}/, class => "ctx" },
2431 # classifier for context must come before classifier add/rem,
2432 # or we would have to use more complicated regexp, for example
2433 # qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
2434 { regexp => qr/^[+ ]{$num_sign}/, class => "add" },
2435 { regexp => qr/^[- ]{$num_sign}/, class => "rem" },
2436 );
2437 for my $clsfy (@diff_line_classifier) {
2438 return $clsfy->{'class'}
2439 if ($line =~ $clsfy->{'regexp'});
2440 }
2441
2442 # fallback
2443 return "";
2444}
2445
f1310cf5
JN
Jakub Narębski2011-10-31 00:36:21 +01002446# assumes that $from and $to are defined and correctly filled,
2447# and that $line holds a line of chunk header for unified diff
2448sub format_unidiff_chunk_header {
2449 my ($line, $from, $to) = @_;
2450
2451 my ($from_text, $from_start, $from_lines, $to_text, $to_start, $to_lines, $section) =
2452 $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;
2453
2454 $from_lines = 0 unless defined $from_lines;
2455 $to_lines = 0 unless defined $to_lines;
2456
2457 if ($from->{'href'}) {
2458 $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
2459 -class=>"list"}, $from_text);
2460 }
2461 if ($to->{'href'}) {
2462 $to_text = $cgi->a({-href=>"$to->{'href'}#l$to_start",
2463 -class=>"list"}, $to_text);
2464 }
2465 $line = "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
2466 "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
2467 return $line;
2468}
2469
2470# assumes that $from and $to are defined and correctly filled,
2471# and that $line holds a line of chunk header for combined diff
2472sub format_cc_diff_chunk_header {
2473 my ($line, $from, $to) = @_;
2474
2475 my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;
2476 my (@from_text, @from_start, @from_nlines, $to_text, $to_start, $to_nlines);
2477
2478 @from_text = split(' ', $ranges);
2479 for (my $i = 0; $i < @from_text; ++$i) {
2480 ($from_start[$i], $from_nlines[$i]) =
2481 (split(',', substr($from_text[$i], 1)), 0);
2482 }
2483
2484 $to_text = pop @from_text;
2485 $to_start = pop @from_start;
2486 $to_nlines = pop @from_nlines;
2487
2488 $line = "<span class=\"chunk_info\">$prefix ";
2489 for (my $i = 0; $i < @from_text; ++$i) {
2490 if ($from->{'href'}[$i]) {
2491 $line .= $cgi->a({-href=>"$from->{'href'}[$i]#l$from_start[$i]",
2492 -class=>"list"}, $from_text[$i]);
2493 } else {
2494 $line .= $from_text[$i];
2495 }
2496 $line .= " ";
2497 }
2498 if ($to->{'href'}) {
2499 $line .= $cgi->a({-href=>"$to->{'href'}#l$to_start",
2500 -class=>"list"}, $to_text);
2501 } else {
2502 $line .= $to_text;
2503 }
2504 $line .= " $prefix</span>" .
2505 "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
2506 return $line;
2507}
2508
6ba1eb51 Kato Kazuyoshi2011-10-31 00:36:22 +01002509# process patch (diff) line (not to be used for diff headers),
5fb6ddf6
MK
Michał Kiedrowicz2012-04-11 23:18:43 +02002510# returning HTML-formatted (but not wrapped) line.
2511# If the line is passed as a reference, it is treated as HTML and not
2512# esc_html()'ed.
f4a81026
MK
Michał Kiedrowicz2012-04-11 23:18:42 +02002513sub format_diff_line {
2514 my ($line, $diff_class, $from, $to) = @_;
eee08903 Jakub Narębski2006-08-24 00:15:14 +02002515
5fb6ddf6
MK
Michał Kiedrowicz2012-04-11 23:18:43 +02002516 if (ref($line)) {
2517 $line = $$line;
f4a81026 Michał Kiedrowicz2012-04-11 23:18:42 +02002518 } else {
5fb6ddf6
MK
Michał Kiedrowicz2012-04-11 23:18:43 +02002519 chomp $line;
2520 $line = untabify($line);
20a864cd Jakub Narębski2011-10-31 00:36:20 +01002521
5fb6ddf6
MK
Michał Kiedrowicz2012-04-11 23:18:43 +02002522 if ($from && $to && $line =~ m/^\@{2} /) {
2523 $line = format_unidiff_chunk_header($line, $from, $to);
2524 } elsif ($from && $to && $line =~ m/^\@{3}/) {
2525 $line = format_cc_diff_chunk_header($line, $from, $to);
2526 } else {
2527 $line = esc_html($line, -nbsp=>1);
2528 }
59e3b14e Jakub Narębski2006-11-18 23:35:40 +01002529 }
e72c0eaf Jakub Narębski2007-05-07 01:10:05 +02002530
f4a81026
MK
Michał Kiedrowicz2012-04-11 23:18:42 +02002531 my $diff_classes = "diff";
2532 $diff_classes .= " $diff_class" if ($diff_class);
2533 $line = "<div class=\"$diff_classes\">$line</div>\n";
f1310cf5 Jakub Narębski2011-10-31 00:36:21 +01002534
f4a81026 Michał Kiedrowicz2012-04-11 23:18:42 +02002535 return $line;
eee08903
JN
Jakub Narębski2006-08-24 00:15:14 +02002536}
2537
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +02002538# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
2539# linked. Pass the hash of the tree/commit to snapshot.
2540sub format_snapshot_links {
2541 my ($hash) = @_;
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +02002542 my $num_fmts = @snapshot_fmts;
2543 if ($num_fmts > 1) {
2544 # A parenthesized list of links bearing format names.
a781785d Jakub Narębski2007-07-22 23:41:20 +02002545 # e.g. "snapshot (_tar.gz_ _zip_)"
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +02002546 return "snapshot (" . join(' ', map
2547 $cgi->a({
2548 -href => href(
2549 action=>"snapshot",
2550 hash=>$hash,
2551 snapshot_format=>$_
2552 )
2553 }, $known_snapshot_formats{$_}{'display'})
2554 , @snapshot_fmts) . ")";
2555 } elsif ($num_fmts == 1) {
2556 # A single "snapshot" link whose tooltip bears the format name.
a781785d Jakub Narębski2007-07-22 23:41:20 +02002557 # i.e. "_snapshot_"
a3c8ab30 Matt McCutchen2007-07-22 01:30:27 +02002558 my ($fmt) = @snapshot_fmts;
a781785d
JN
Jakub Narębski2007-07-22 23:41:20 +02002559 return
2560 $cgi->a({
a3c8ab30
MM
Matt McCutchen2007-07-22 01:30:27 +02002561 -href => href(
2562 action=>"snapshot",
2563 hash=>$hash,
2564 snapshot_format=>$fmt
2565 ),
2566 -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
2567 }, "snapshot");
2568 } else { # $num_fmts == 0
2569 return undef;
2570 }
2571}
2572
3562198b
JN
Jakub Narębski2008-04-20 22:09:48 +02002573## ......................................................................
2574## functions returning values to be passed, perhaps after some
2575## transformation, to other functions; e.g. returning arguments to href()
2576
2577# returns hash to be passed to href to generate gitweb URL
2578# in -title key it returns description of link
2579sub get_feed_info {
2580 my $format = shift || 'Atom';
2581 my %res = (action => lc($format));
8d646a9b Krzesimir Nowak2013-12-11 12:54:43 +01002582 my $matched_ref = 0;
3562198b
JN
Jakub Narębski2008-04-20 22:09:48 +02002583
2584 # feed links are possible only for project views
2585 return unless (defined $project);
2586 # some views should link to OPML, or to generic project feed,
2587 # or don't have specific feed yet (so they should use generic)
18ab83e8 Jakub Narębski2012-01-07 11:47:38 +01002588 return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);
3562198b Jakub Narębski2008-04-20 22:09:48 +02002589
8d646a9b
KN
Krzesimir Nowak2013-12-11 12:54:43 +01002590 my $branch = undef;
2591 # branches refs uses 'refs/' + $get_branch_refs()[x] + '/' prefix
2592 # (fullname) to differentiate from tag links; this also makes
2593 # possible to detect branch links
2594 for my $ref (get_branch_refs()) {
2595 if ((defined $hash_base && $hash_base =~ m!^refs/\Q$ref\E/(.*)$!) ||
2596 (defined $hash && $hash =~ m!^refs/\Q$ref\E/(.*)$!)) {
2597 $branch = $1;
2598 $matched_ref = $ref;
2599 last;
2600 }
3562198b
JN
Jakub Narębski2008-04-20 22:09:48 +02002601 }
2602 # find log type for feed description (title)
2603 my $type = 'log';
2604 if (defined $file_name) {
2605 $type = "history of $file_name";
2606 $type .= "/" if ($action eq 'tree');
2607 $type .= " on '$branch'" if (defined $branch);
2608 } else {
2609 $type = "log of $branch" if (defined $branch);
2610 }
2611
2612 $res{-title} = $type;
8d646a9b Krzesimir Nowak2013-12-11 12:54:43 +01002613 $res{'hash'} = (defined $branch ? "refs/$matched_ref/$branch" : undef);
3562198b
JN
Jakub Narębski2008-04-20 22:09:48 +02002614 $res{'file_name'} = $file_name;
2615
2616 return %res;
2617}
2618
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002619## ----------------------------------------------------------------------
2620## git utility subroutines, invoking git commands
42f7eb94 Kay Sievers2005-08-07 20:21:46 +02002621
25691fbe
DS
Dennis Stosberg2006-08-28 17:49:58 +02002622# returns path to the core git executable and the --git-dir parameter as list
2623sub git_cmd {
aa7dd05e Jakub Narębski2009-09-01 13:39:16 +02002624 $number_of_git_cmds++;
25691fbe
DS
Dennis Stosberg2006-08-28 17:49:58 +02002625 return $GIT, '--git-dir='.$git_dir;
2626}
2627
516381d5
LW
Lea Wiemann2008-06-17 23:46:35 +02002628# quote the given arguments for passing them to the shell
2629# quote_command("command", "arg 1", "arg with ' and ! characters")
2630# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
2631# Try to avoid using this function wherever possible.
2632sub quote_command {
2633 return join(' ',
68cedb1f Jakub Narębski2009-05-10 02:40:37 +02002634 map { my $a = $_; $a =~ s/(['!])/'\\$1'/g; "'$a'" } @_ );
25691fbe
DS
Dennis Stosberg2006-08-28 17:49:58 +02002635}
2636
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002637# get HEAD ref of given project as hash
847e01fb Jakub Narębski2006-08-14 02:05:47 +02002638sub git_get_head_hash {
b629275f
MR
Mark Rada2009-11-07 16:13:29 +01002639 return git_get_full_hash(shift, 'HEAD');
2640}
2641
2642sub git_get_full_hash {
2643 return git_get_hash(@_);
2644}
2645
2646sub git_get_short_hash {
2647 return git_get_hash(@_, '--short=7');
2648}
2649
2650sub git_get_hash {
2651 my ($project, $hash, @options) = @_;
25691fbe Dennis Stosberg2006-08-28 17:49:58 +02002652 my $o_git_dir = $git_dir;
df2c37a5 Junio C Hamano2006-01-09 13:13:39 +01002653 my $retval = undef;
25691fbe Dennis Stosberg2006-08-28 17:49:58 +02002654 $git_dir = "$projectroot/$project";
b629275f
MR
Mark Rada2009-11-07 16:13:29 +01002655 if (open my $fd, '-|', git_cmd(), 'rev-parse',
2656 '--verify', '-q', @options, $hash) {
2657 $retval = <$fd>;
2658 chomp $retval if defined $retval;
df2c37a5 Junio C Hamano2006-01-09 13:13:39 +01002659 close $fd;
df2c37a5 Junio C Hamano2006-01-09 13:13:39 +01002660 }
25691fbe
DS
Dennis Stosberg2006-08-28 17:49:58 +02002661 if (defined $o_git_dir) {
2662 $git_dir = $o_git_dir;
2c5c008b Kay Sievers2006-01-17 03:50:20 +01002663 }
df2c37a5
JH
Junio C Hamano2006-01-09 13:13:39 +01002664 return $retval;
2665}
2666
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002667# get type of given object
2668sub git_get_type {
2669 my $hash = shift;
2670
25691fbe Dennis Stosberg2006-08-28 17:49:58 +02002671 open my $fd, "-|", git_cmd(), "cat-file", '-t', $hash or return;
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002672 my $type = <$fd>;
2673 close $fd or return;
2674 chomp $type;
2675 return $type;
2676}
2677
b201927a
JN
Jakub Narębski2007-11-03 00:41:19 +01002678# repository configuration
2679our $config_file = '';
2680our %config;
2681
2682# store multiple values for single key as anonymous array reference
2683# single values stored directly in the hash, not as [ <value> ]
2684sub hash_set_multi {
2685 my ($hash, $key, $value) = @_;
2686
2687 if (!exists $hash->{$key}) {
2688 $hash->{$key} = $value;
2689 } elsif (!ref $hash->{$key}) {
2690 $hash->{$key} = [ $hash->{$key}, $value ];
2691 } else {
2692 push @{$hash->{$key}}, $value;
2693 }
2694}
2695
2696# return hash of git project configuration
2697# optionally limited to some section, e.g. 'gitweb'
2698sub git_parse_project_config {
2699 my $section_regexp = shift;
2700 my %config;
2701
2702 local $/ = "\0";
2703
2704 open my $fh, "-|", git_cmd(), "config", '-z', '-l',
2705 or return;
2706
2707 while (my $keyval = <$fh>) {
2708 chomp $keyval;
2709 my ($key, $value) = split(/\n/, $keyval, 2);
2710
2711 hash_set_multi(\%config, $key, $value)
2712 if (!defined $section_regexp || $key =~ /^(?:$section_regexp)\./o);
2713 }
2714 close $fh;
2715
2716 return %config;
2717}
2718
df5d10a3 Marcel M. Cary2009-02-18 14:09:41 +01002719# convert config value to boolean: 'true' or 'false'
b201927a
JN
Jakub Narębski2007-11-03 00:41:19 +01002720# no value, number > 0, 'true' and 'yes' values are true
2721# rest of values are treated as false (never as error)
2722sub config_to_bool {
2723 my $val = shift;
2724
df5d10a3
MC
Marcel M. Cary2009-02-18 14:09:41 +01002725 return 1 if !defined $val; # section.key
2726
b201927a
JN
Jakub Narębski2007-11-03 00:41:19 +01002727 # strip leading and trailing whitespace
2728 $val =~ s/^\s+//;
2729 $val =~ s/\s+$//;
2730
df5d10a3 Marcel M. Cary2009-02-18 14:09:41 +01002731 return (($val =~ /^\d+$/ && $val) || # section.key = 1
b201927a
JN
Jakub Narębski2007-11-03 00:41:19 +01002732 ($val =~ /^(?:true|yes)$/i)); # section.key = true
2733}
2734
2735# convert config value to simple decimal number
2736# an optional value suffix of 'k', 'm', or 'g' will cause the value
2737# to be multiplied by 1024, 1048576, or 1073741824
2738sub config_to_int {
2739 my $val = shift;
2740
2741 # strip leading and trailing whitespace
2742 $val =~ s/^\s+//;
2743 $val =~ s/\s+$//;
2744
2745 if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
2746 $unit = lc($unit);
2747 # unknown unit is treated as 1
2748 return $num * ($unit eq 'g' ? 1073741824 :
2749 $unit eq 'm' ? 1048576 :
2750 $unit eq 'k' ? 1024 : 1);
2751 }
2752 return $val;
2753}
2754
2755# convert config value to array reference, if needed
2756sub config_to_multi {
2757 my $val = shift;
2758
d76a585d Jakub Narębski2007-12-20 10:48:09 +01002759 return ref($val) ? $val : (defined($val) ? [ $val ] : []);
b201927a
JN
Jakub Narębski2007-11-03 00:41:19 +01002760}
2761
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002762sub git_get_project_config {
ddb8d900 Aneesh Kumar K.V2006-08-20 11:53:04 +05302763 my ($key, $type) = @_;
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002764
7a49c254 Jakub Narębski2010-03-27 20:26:59 +01002765 return unless defined $git_dir;
9be3614e Jakub Narębski2010-03-01 22:51:34 +01002766
b201927a Jakub Narębski2007-11-03 00:41:19 +01002767 # key sanity check
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002768 return unless ($key);
14569cd8
JN
Jakub Narębski2011-07-28 23:38:03 +02002769 # only subsection, if exists, is case sensitive,
2770 # and not lowercased by 'git config -z -l'
2771 if (my ($hi, $mi, $lo) = ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/)) {
af507944 Phil Pennock2012-11-05 18:50:47 -05002772 $lo =~ s/_//g;
14569cd8 Jakub Narębski2011-07-28 23:38:03 +02002773 $key = join(".", lc($hi), $mi, lc($lo));
af507944 Phil Pennock2012-11-05 18:50:47 -05002774 return if ($lo =~ /\W/ || $hi =~ /\W/);
14569cd8
JN
Jakub Narębski2011-07-28 23:38:03 +02002775 } else {
2776 $key = lc($key);
af507944
PP
Phil Pennock2012-11-05 18:50:47 -05002777 $key =~ s/_//g;
2778 return if ($key =~ /\W/);
14569cd8 Jakub Narębski2011-07-28 23:38:03 +02002779 }
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002780 $key =~ s/^gitweb\.//;
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002781
b201927a
JN
Jakub Narębski2007-11-03 00:41:19 +01002782 # type sanity check
2783 if (defined $type) {
2784 $type =~ s/^--//;
2785 $type = undef
2786 unless ($type eq 'bool' || $type eq 'int');
2787 }
2788
2789 # get config
2790 if (!defined $config_file ||
2791 $config_file ne "$git_dir/config") {
2792 %config = git_parse_project_config('gitweb');
2793 $config_file = "$git_dir/config";
2794 }
2795
df5d10a3
MC
Marcel M. Cary2009-02-18 14:09:41 +01002796 # check if config variable (key) exists
2797 return unless exists $config{"gitweb.$key"};
2798
b201927a
JN
Jakub Narębski2007-11-03 00:41:19 +01002799 # ensure given type
2800 if (!defined $type) {
2801 return $config{"gitweb.$key"};
2802 } elsif ($type eq 'bool') {
2803 # backward compatibility: 'git config --bool' returns true/false
2804 return config_to_bool($config{"gitweb.$key"}) ? 'true' : 'false';
2805 } elsif ($type eq 'int') {
2806 return config_to_int($config{"gitweb.$key"});
2807 }
2808 return $config{"gitweb.$key"};
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002809}
2810
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002811# get hash of given path at given ref
2812sub git_get_hash_by_path {
2813 my $base = shift;
2814 my $path = shift || return undef;
1d782b03 Jakub Narębski2006-09-21 18:09:12 +02002815 my $type = shift;
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002816
4b02f483 Jakub Narębski2006-09-26 01:54:24 +02002817 $path =~ s,/+$,,;
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002818
25691fbe Dennis Stosberg2006-08-28 17:49:58 +02002819 open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
074afaa0 Lea Wiemann2008-06-19 22:03:21 +02002820 or die_error(500, "Open git-ls-tree failed");
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002821 my $line = <$fd>;
2822 close $fd or return undef;
2823
198a2a8a
JN
Jakub Narębski2007-05-12 21:16:34 +02002824 if (!defined $line) {
2825 # there is no tree or hash given by $path at $base
2826 return undef;
2827 }
2828
717b8311 Jakub Narębski2006-07-31 21:22:15 +02002829 #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa panic.c'
8b4b94cc Jakub Narębski2006-10-30 22:25:11 +01002830 $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/;
1d782b03
JN
Jakub Narębski2006-09-21 18:09:12 +02002831 if (defined $type && $type ne $2) {
2832 # type doesn't match
2833 return undef;
2834 }
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002835 return $3;
2836}
2837
ed224dea
JN
Jakub Narębski2007-05-07 01:10:04 +02002838# get path of entry with given hash at given tree-ish (ref)
2839# used to get 'from' filename for combined diff (merge commit) for renames
2840sub git_get_path_by_hash {
2841 my $base = shift || return;
2842 my $hash = shift || return;
2843
2844 local $/ = "\0";
2845
2846 open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
2847 or return undef;
2848 while (my $line = <$fd>) {
2849 chomp $line;
2850
2851 #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423 gitweb'
2852 #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f gitweb/README'
2853 if ($line =~ m/(?:[0-9]+) (?:.+) $hash\t(.+)$/) {
2854 close $fd;
2855 return $1;
2856 }
2857 }
2858 close $fd;
2859 return undef;
2860}
2861
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02002862## ......................................................................
2863## git utility functions, directly accessing git repository
2864
e4e3b32b
SC
Sebastien Cevey2011-04-29 19:52:00 +02002865# get the value of config variable either from file named as the variable
2866# itself in the repository ($GIT_DIR/$name file), or from gitweb.$name
2867# configuration variable in the repository config file.
2868sub git_get_file_or_project_config {
2869 my ($path, $name) = @_;
09bd7898 Kay Sievers2005-08-07 20:21:23 +02002870
0e121a2c Jakub Narębski2007-11-03 00:41:20 +01002871 $git_dir = "$projectroot/$path";
e4e3b32b
SC
Sebastien Cevey2011-04-29 19:52:00 +02002872 open my $fd, '<', "$git_dir/$name"
2873 or return git_get_project_config($name);
2874 my $conf = <$fd>;
b87d78d6 Kay Sievers2005-08-07 20:21:04 +02002875 close $fd;
e4e3b32b
SC
Sebastien Cevey2011-04-29 19:52:00 +02002876 if (defined $conf) {
2877 chomp $conf;
2eb54efc Junio C Hamano2007-05-16 21:04:16 -07002878 }
e4e3b32b
SC
Sebastien Cevey2011-04-29 19:52:00 +02002879 return $conf;
2880}
2881
2882sub git_get_project_description {
2883 my $path = shift;
2884 return git_get_file_or_project_config($path, 'description');
12a88f2f
KS
Kay Sievers2005-08-07 20:02:47 +02002885}
2886
d940c901
SC
Sebastien Cevey2011-04-29 19:52:01 +02002887sub git_get_project_category {
2888 my $path = shift;
2889 return git_get_file_or_project_config($path, 'category');
12a88f2f
KS
Kay Sievers2005-08-07 20:02:47 +02002890}
2891
d940c901 Sebastien Cevey2011-04-29 19:52:01 +02002892
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +02002893# supported formats:
2894# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
2895# - if its contents is a number, use it as tag weight,
2896# - otherwise add a tag with weight 1
2897# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
2898# the same value multiple times increases tag weight
2899# * `gitweb.ctag' multi-valued repo config variable
aed93de4 Petr Baudis2008-10-02 17:13:02 +02002900sub git_get_project_ctags {
0368c492 Jakub Narębski2011-04-29 19:51:57 +02002901 my $project = shift;
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +02002902 my $ctags = {};
2903
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +02002904 $git_dir = "$projectroot/$project";
2905 if (opendir my $dh, "$git_dir/ctags") {
2906 my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
2907 foreach my $tagfile (@files) {
2908 open my $ct, '<', $tagfile
2909 or next;
2910 my $val = <$ct>;
2911 chomp $val if $val;
2912 close $ct;
2913
2914 (my $ctag = $tagfile) =~ s#.*/##;
2c162b56 Jonathan Nieder2011-06-09 02:08:57 -05002915 if ($val =~ /^\d+$/) {
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +02002916 $ctags->{$ctag} = $val;
2917 } else {
2918 $ctags->{$ctag} = 1;
2919 }
2920 }
2921 closedir $dh;
2922
2923 } elsif (open my $fh, '<', "$git_dir/ctags") {
2924 while (my $line = <$fh>) {
2925 chomp $line;
2926 $ctags->{$line}++ if $line;
2927 }
2928 close $fh;
2929
2930 } else {
2931 my $taglist = config_to_multi(git_get_project_config('ctag'));
2932 foreach my $tag (@$taglist) {
2933 $ctags->{$tag}++;
2934 }
aed93de4 Petr Baudis2008-10-02 17:13:02 +02002935 }
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +02002936
2937 return $ctags;
2938}
2939
2940# return hash, where keys are content tags ('ctags'),
2941# and values are sum of weights of given tag in every project
2942sub git_gather_all_ctags {
2943 my $projects = shift;
2944 my $ctags = {};
2945
2946 foreach my $p (@$projects) {
2947 foreach my $ct (keys %{$p->{'ctags'}}) {
2948 $ctags->{$ct} += $p->{'ctags'}->{$ct};
2949 }
aed93de4 Petr Baudis2008-10-02 17:13:02 +02002950 }
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +02002951
2952 return $ctags;
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +02002953}
2954
2955sub git_populate_project_tagcloud {
2956 my $ctags = shift;
2957
2958 # First, merge different-cased tags; tags vote on casing
2959 my %ctags_lc;
2960 foreach (keys %$ctags) {
2961 $ctags_lc{lc $_}->{count} += $ctags->{$_};
2962 if (not $ctags_lc{lc $_}->{topcount}
2963 or $ctags_lc{lc $_}->{topcount} < $ctags->{$_}) {
2964 $ctags_lc{lc $_}->{topcount} = $ctags->{$_};
2965 $ctags_lc{lc $_}->{topname} = $_;
2966 }
2967 }
2968
2969 my $cloud;
84d9e2d5 Jakub Narębski2012-02-03 13:44:54 +01002970 my $matched = $input_params{'ctag'};
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +02002971 if (eval { require HTML::TagCloud; 1; }) {
2972 $cloud = HTML::TagCloud->new;
0368c492 Jakub Narębski2011-04-29 19:51:57 +02002973 foreach my $ctag (sort keys %ctags_lc) {
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +02002974 # Pad the title with spaces so that the cloud looks
2975 # less crammed.
0368c492 Jakub Narębski2011-04-29 19:51:57 +02002976 my $title = esc_html($ctags_lc{$ctag}->{topname});
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +02002977 $title =~ s/ /&nbsp;/g;
2978 $title =~ s/^/&nbsp;/g;
2979 $title =~ s/$/&nbsp;/g;
4b9447f9
JN
Jakub Narębski2011-04-29 19:51:58 +02002980 if (defined $matched && $matched eq $ctag) {
2981 $title = qq(<span class="match">$title</span>);
2982 }
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +02002983 $cloud->add($title, href(project=>undef, ctag=>$ctag),
2984 $ctags_lc{$ctag}->{count});
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +02002985 }
2986 } else {
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +02002987 $cloud = {};
2988 foreach my $ctag (keys %ctags_lc) {
4b9447f9
JN
Jakub Narębski2011-04-29 19:51:58 +02002989 my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
2990 if (defined $matched && $matched eq $ctag) {
2991 $title = qq(<span class="match">$title</span>);
2992 }
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +02002993 $cloud->{$ctag}{count} = $ctags_lc{$ctag}->{count};
2994 $cloud->{$ctag}{ctag} =
4b9447f9 Jakub Narębski2011-04-29 19:51:58 +02002995 $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
0368c492 Jakub Narębski2011-04-29 19:51:57 +02002996 }
aed93de4 Petr Baudis2008-10-02 17:13:02 +02002997 }
0368c492 Jakub Narębski2011-04-29 19:51:57 +02002998 return $cloud;
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +02002999}
3000
3001sub git_show_project_tagcloud {
3002 my ($cloud, $count) = @_;
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +02003003 if (ref $cloud eq 'HTML::TagCloud') {
3004 return $cloud->html_and_css($count);
3005 } else {
0368c492
JN
Jakub Narębski2011-04-29 19:51:57 +02003006 my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
3007 return
3008 '<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
3009 join (', ', map {
3010 $cloud->{$_}->{'ctag'}
3011 } splice(@tags, 0, $count)) .
3012 '</div>';
aed93de4
PB
Petr Baudis2008-10-02 17:13:02 +02003013 }
3014}
3015
e79ca7cc
JN
Jakub Narębski2006-08-16 14:50:34 +02003016sub git_get_project_url_list {
3017 my $path = shift;
3018
0e121a2c Jakub Narębski2007-11-03 00:41:20 +01003019 $git_dir = "$projectroot/$path";
dff2b6d4 Jakub Narębski2009-05-10 02:38:34 +02003020 open my $fd, '<', "$git_dir/cloneurl"
0e121a2c
JN
Jakub Narębski2007-11-03 00:41:20 +01003021 or return wantarray ?
3022 @{ config_to_multi(git_get_project_config('url')) } :
3023 config_to_multi(git_get_project_config('url'));
e79ca7cc
JN
Jakub Narębski2006-08-16 14:50:34 +02003024 my @git_project_url_list = map { chomp; $_ } <$fd>;
3025 close $fd;
3026
3027 return wantarray ? @git_project_url_list : \@git_project_url_list;
3028}
3029
847e01fb Jakub Narębski2006-08-14 02:05:47 +02003030sub git_get_projects_list {
12b1443c Jakub Narębski2011-04-29 19:51:56 +02003031 my $filter = shift || '';
348a6589 Bernhard R. Link2012-01-30 21:06:38 +01003032 my $paranoid = shift;
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02003033 my @list;
3034
3035 if (-d $projects_list) {
3036 # search in directory
12b1443c Jakub Narębski2011-04-29 19:51:56 +02003037 my $dir = $projects_list;
6768d6b8
AK
Aneesh Kumar K.V2006-11-03 10:41:45 +05303038 # remove the trailing "/"
3039 $dir =~ s!/+$!!;
ac593b76
MM
Matthieu Moy2012-01-04 11:07:45 +01003040 my $pfxlen = length("$dir");
3041 my $pfxdepth = ($dir =~ tr!/!!);
12b1443c Jakub Narębski2011-04-29 19:51:56 +02003042 # when filtering, search only given subdirectory
348a6589 Bernhard R. Link2012-01-30 21:06:38 +01003043 if ($filter && !$paranoid) {
12b1443c
JN
Jakub Narębski2011-04-29 19:51:56 +02003044 $dir .= "/$filter";
3045 $dir =~ s!/+$!!;
3046 }
c0011ff8
JN
Jakub Narębski2006-09-14 22:18:59 +02003047
3048 File::Find::find({
3049 follow_fast => 1, # follow symbolic links
d20602ee Junio C Hamano2007-07-27 01:23:03 -07003050 follow_skip => 2, # ignore duplicates
c0011ff8
JN
Jakub Narębski2006-09-14 22:18:59 +02003051 dangling_symlinks => 0, # ignore dangling symlinks, silently
3052 wanted => sub {
ee1d8ee0
JN
Jakub Narębski2010-04-30 18:30:31 +02003053 # global variables
3054 our $project_maxdepth;
3055 our $projectroot;
c0011ff8
JN
Jakub Narębski2006-09-14 22:18:59 +02003056 # skip project-list toplevel, if we get it.
3057 return if (m!^[/.]$!);
3058 # only directories can be git repositories
3059 return unless (-d $_);
ca5e9495 Luke Lu2007-10-16 20:45:25 -07003060 # don't traverse too deep (Find is super slow on os x)
12b1443c Jakub Narębski2011-04-29 19:51:56 +02003061 # $project_maxdepth excludes depth of $projectroot
ca5e9495
LL
Luke Lu2007-10-16 20:45:25 -07003062 if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
3063 $File::Find::prune = 1;
3064 return;
3065 }
c0011ff8 Jakub Narębski2006-09-14 22:18:59 +02003066
12b1443c Jakub Narębski2011-04-29 19:51:56 +02003067 my $path = substr($File::Find::name, $pfxlen + 1);
348a6589
BL
Bernhard R. Link2012-01-30 21:06:38 +01003068 # paranoidly only filter here
3069 if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
3070 next;
3071 }
c0011ff8 Jakub Narębski2006-09-14 22:18:59 +02003072 # we check related file in $projectroot
fb3bb3d1
DD
Devin Doucette2008-12-27 02:39:31 -07003073 if (check_export_ok("$projectroot/$path")) {
3074 push @list, { path => $path };
c0011ff8
JN
Jakub Narębski2006-09-14 22:18:59 +02003075 $File::Find::prune = 1;
3076 }
3077 },
3078 }, "$dir");
3079
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02003080 } elsif (-f $projects_list) {
3081 # read from file(url-encoded):
3082 # 'git%2Fgit.git Linus+Torvalds'
3083 # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
3084 # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
dff2b6d4 Jakub Narębski2009-05-10 02:38:34 +02003085 open my $fd, '<', $projects_list or return;
c2b8b134 Frank Lichtenheld2007-04-06 23:58:11 +02003086 PROJECT:
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02003087 while (my $line = <$fd>) {
3088 chomp $line;
3089 my ($path, $owner) = split ' ', $line;
3090 $path = unescape($path);
3091 $owner = unescape($owner);
3092 if (!defined $path) {
3093 next;
3094 }
12b1443c
JN
Jakub Narębski2011-04-29 19:51:56 +02003095 # if $filter is rpovided, check if $path begins with $filter
3096 if ($filter && $path !~ m!^\Q$filter\E/!) {
3097 next;
83ee94c1 Junio C Hamano2006-11-07 22:37:17 -08003098 }
2172ce4b Junio C Hamano2006-10-03 02:30:47 -07003099 if (check_export_ok("$projectroot/$path")) {
717b8311 Jakub Narębski2006-07-31 21:22:15 +02003100 my $pr = {
75e0dffe Kacper Kornet2012-04-24 19:50:05 +02003101 path => $path
717b8311 Jakub Narębski2006-07-31 21:22:15 +02003102 };
75e0dffe
KK
Kacper Kornet2012-04-24 19:50:05 +02003103 if ($owner) {
3104 $pr->{'owner'} = to_utf8($owner);
3105 }
c2b8b134 Frank Lichtenheld2007-04-06 23:58:11 +02003106 push @list, $pr;
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02003107 }
3108 }
3109 close $fd;
3110 }
717b8311
JN
Jakub Narębski2006-07-31 21:22:15 +02003111 return @list;
3112}
3113
12b1443c
JN
Jakub Narębski2011-04-29 19:51:56 +02003114# written with help of Tree::Trie module (Perl Artistic License, GPL compatibile)
3115# as side effects it sets 'forks' field to list of forks for forked projects
3116sub filter_forks_from_projects_list {
3117 my $projects = shift;
3118
3119 my %trie; # prefix tree of directories (path components)
3120 # generate trie out of those directories that might contain forks
3121 foreach my $pr (@$projects) {
3122 my $path = $pr->{'path'};
3123 $path =~ s/\.git$//; # forks of 'repo.git' are in 'repo/' directory
3124 next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
3125 next unless ($path); # skip '.git' repository: tests, git-instaweb
53c632fa Julien Muchembled2011-10-21 21:04:21 +02003126 next unless (-d "$projectroot/$path"); # containing directory exists
12b1443c
JN
Jakub Narębski2011-04-29 19:51:56 +02003127 $pr->{'forks'} = []; # there can be 0 or more forks of project
3128
3129 # add to trie
3130 my @dirs = split('/', $path);
3131 # walk the trie, until either runs out of components or out of trie
3132 my $ref = \%trie;
3133 while (scalar @dirs &&
3134 exists($ref->{$dirs[0]})) {
3135 $ref = $ref->{shift @dirs};
3136 }
3137 # create rest of trie structure from rest of components
3138 foreach my $dir (@dirs) {
3139 $ref = $ref->{$dir} = {};
3140 }
3141 # create end marker, store $pr as a data
3142 $ref->{''} = $pr if (!exists $ref->{''});
3143 }
3144
3145 # filter out forks, by finding shortest prefix match for paths
3146 my @filtered;
3147 PROJECT:
3148 foreach my $pr (@$projects) {
3149 # trie lookup
3150 my $ref = \%trie;
3151 DIR:
3152 foreach my $dir (split('/', $pr->{'path'})) {
3153 if (exists $ref->{''}) {
3154 # found [shortest] prefix, is a fork - skip it
3155 push @{$ref->{''}{'forks'}}, $pr;
3156 next PROJECT;
3157 }
3158 if (!exists $ref->{$dir}) {
3159 # not in trie, cannot have prefix, not a fork
3160 push @filtered, $pr;
3161 next PROJECT;
3162 }
3163 # If the dir is there, we just walk one step down the trie.
3164 $ref = $ref->{$dir};
3165 }
3166 # we ran out of trie
3167 # (shouldn't happen: it's either no match, or end marker)
3168 push @filtered, $pr;
3169 }
3170
3171 return @filtered;
3172}
3173
3174# note: fill_project_list_info must be run first,
3175# for 'descr_long' and 'ctags' to be filled
3176sub search_projects_list {
3177 my ($projlist, %opts) = @_;
3178 my $tagfilter = $opts{'tagfilter'};
e65ceb61 Jakub Narębski2012-03-02 23:34:24 +01003179 my $search_re = $opts{'search_regexp'};
12b1443c
JN
Jakub Narębski2011-04-29 19:51:56 +02003180
3181 return @$projlist
e65ceb61 Jakub Narębski2012-03-02 23:34:24 +01003182 unless ($tagfilter || $search_re);
12b1443c Jakub Narębski2011-04-29 19:51:56 +02003183
07b257f9
JN
Jakub Narębski2012-02-23 16:54:48 +01003184 # searching projects require filling to be run before it;
3185 fill_project_list_info($projlist,
3186 $tagfilter ? 'ctags' : (),
aa145bf6 Junio C Hamano2012-03-08 13:04:49 -08003187 $search_re ? ('path', 'descr') : ());
12b1443c
JN
Jakub Narębski2011-04-29 19:51:56 +02003188 my @projects;
3189 PROJECT:
3190 foreach my $pr (@$projlist) {
3191
3192 if ($tagfilter) {
3193 next unless ref($pr->{'ctags'}) eq 'HASH';
3194 next unless
3195 grep { lc($_) eq lc($tagfilter) } keys %{$pr->{'ctags'}};
3196 }
3197
e65ceb61 Jakub Narębski2012-03-02 23:34:24 +01003198 if ($search_re) {
12b1443c Jakub Narębski2011-04-29 19:51:56 +02003199 next unless
e65ceb61
JN
Jakub Narębski2012-03-02 23:34:24 +01003200 $pr->{'path'} =~ /$search_re/ ||
3201 $pr->{'descr_long'} =~ /$search_re/;
12b1443c
JN
Jakub Narębski2011-04-29 19:51:56 +02003202 }
3203
3204 push @projects, $pr;
3205 }
3206
3207 return @projects;
3208}
3209
47852450
JH
Junio C Hamano2007-07-03 22:10:42 -07003210our $gitweb_project_owner = undef;
3211sub git_get_project_list_from_file {
1e0cf030 Jakub Narębski2006-08-14 02:10:06 +02003212
47852450 Junio C Hamano2007-07-03 22:10:42 -07003213 return if (defined $gitweb_project_owner);
1e0cf030 Jakub Narębski2006-08-14 02:10:06 +02003214
47852450 Junio C Hamano2007-07-03 22:10:42 -07003215 $gitweb_project_owner = {};
1e0cf030
JN
Jakub Narębski2006-08-14 02:10:06 +02003216 # read from file (url-encoded):
3217 # 'git%2Fgit.git Linus+Torvalds'
3218 # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
3219 # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
3220 if (-f $projects_list) {
dff2b6d4 Jakub Narębski2009-05-10 02:38:34 +02003221 open(my $fd, '<', $projects_list);
1e0cf030
JN
Jakub Narębski2006-08-14 02:10:06 +02003222 while (my $line = <$fd>) {
3223 chomp $line;
3224 my ($pr, $ow) = split ' ', $line;
3225 $pr = unescape($pr);
3226 $ow = unescape($ow);
47852450 Junio C Hamano2007-07-03 22:10:42 -07003227 $gitweb_project_owner->{$pr} = to_utf8($ow);
1e0cf030
JN
Jakub Narębski2006-08-14 02:10:06 +02003228 }
3229 close $fd;
3230 }
47852450
JH
Junio C Hamano2007-07-03 22:10:42 -07003231}
3232
3233sub git_get_project_owner {
3234 my $project = shift;
3235 my $owner;
3236
3237 return undef unless $project;
b59012ef Bruno Ribas2008-02-08 14:38:04 -02003238 $git_dir = "$projectroot/$project";
47852450
JH
Junio C Hamano2007-07-03 22:10:42 -07003239
3240 if (!defined $gitweb_project_owner) {
3241 git_get_project_list_from_file();
3242 }