12 use base
qw(Exporter);
13 our @EXPORT = qw(get_git scrypt jailed_file sendmail_pipe mailer_pipe
14 lock_file unlock_file valid_tag rand_adjust
15 filedb_atomic_append filedb_atomic_edit filedb_grep
16 filedb_atomic_grep valid_email valid_email_multi
17 valid_repo_url valid_web_url url_base url_path url_server
18 projects_html_list parse_rfc2822_date parse_any_date
19 extract_url_hostname is_dns_hostname is_our_hostname
20 get_cmd online_cpus sys_pagesize sys_memsize
21 calc_windowmemory to_utf8 capture_command human_size
22 calc_bigfilethreshold has_reserved_suffix
23 noFatalsToBrowser calc_redeltathreshold
24 clean_email_multi read_HEAD_symref read_config_file
25 read_config_file_hash is_git_dir git_bool);
30 $encoder = Encode
::find_encoding
('Windows-1252') ||
31 Encode
::find_encoding
('ISO-8859-1') or
32 die "failed to load ISO-8859-1 encoder\n";
36 my ($str, $encode) = @_;
37 return undef unless defined $str;
39 if (Encode
::is_utf8
($str) || utf8
::decode
($str)) {
42 $ans = $encoder->decode($str, Encode
::FB_DEFAULT
);
44 utf8
::encode
($ans) if $encode;
48 BEGIN {require "Girocco/extra/capture_command.pl"}
50 # Return the entire output sent to stdout from running a command
51 # Any output the command sends to stderr is discarded
52 # Returns undef if there was an error running the command (see $!)
54 my ($status, $result) = capture_command
(1, undef, @_);
55 return defined($status) && $status == 0 ?
$result : undef;
58 # Same as get_cmd except configured git binary is automatically provided
59 # as the first argument to get_cmd
61 return get_cmd
($Girocco::Config
::git_bin
, @_);
66 crypt($pwd||'', join ('', ('.', '/', 0..9, 'A'..'Z', 'a'..'z')[rand 64, rand 64]));
72 $Girocco::Config
::chroot."/$filename";
81 use Fcntl
qw(O_WRONLY O_CREAT O_EXCL);
83 my $handle = new IO
::Handle
;
85 unless (sysopen($handle, $path, O_WRONLY
|O_CREAT
|O_EXCL
)) {
87 while (not sysopen($handle, $path, O_WRONLY
|O_CREAT
|O_EXCL
)) {
88 ($! == EEXIST
) or die "$path open failed: $!";
89 ($cnt++ < 16) or die "$path open failed: cannot open lockfile";
93 # XXX: filedb-specific
94 chmod 0664, $path or die "$path g+w failed: $!";
100 return defined($_[0]) && $_[0] eq jailed_file
('/etc/passwd');
# Invoke the installation's bin/update-pwd-db helper on a file.
#   $_[0]  path handed to the helper as its first argument
#   $_[1]  optional extra argument, passed along only when it is true
# Dies with the raw wait status ($?) if the helper does not exit with 0.
sub _run_update_pwd_db {
    my ($pwdfile, $extra) = @_;
    my $helper = $Girocco::Config::basedir . '/bin/update-pwd-db';
    my @argv = ("$pwdfile");
    push @argv, $extra if $extra;
    # list form of system: the arguments never pass through a shell
    my $status = system($helper, @argv);
    die "update-pwd-db failed: $?" unless $status == 0;
    return 1;
}
111 my ($path, $noreplace, $updatearg) = @_;
114 _run_update_pwd_db
("$path.lock", $updatearg)
115 if $Girocco::Config
::update_pwd_db
&& _is_passwd_file
($path);
116 rename "$path.lock", $path or die "$path unlock failed: $!";
118 unlink "$path.lock" or die "$path unlock failed: $!";
122 sub filedb_atomic_append
{
123 my ($file, $line, $updatearg) = @_;
126 open my $src, '<', $file or die "$file open for reading failed: $!";
127 my $dst = lock_file
($file);
130 my $aid = (split /:/)[2];
131 $id = $aid + 1 if ($aid >= $id);
133 print $dst $_ or die "$file(l) write failed: $!";
136 $line =~ s/\\i/$id/g;
137 print $dst "$line\n" or die "$file(l) write failed: $!";
139 close $dst or die "$file(l) close failed: $!";
142 unlock_file
($file, 0, $updatearg);
147 sub filedb_atomic_edit
{
148 my ($file, $fn, $updatearg) = @_;
150 open my $src, '<', $file or die "$file open for reading failed: $!";
151 my $dst = lock_file
($file);
154 print $dst $fn->($_) or die "$file(l) write failed: $!";
157 close $dst or die "$file(l) close failed: $!";
160 unlock_file
($file, 0, $updatearg);
163 sub filedb_atomic_grep
{
164 my ($file, $fn) = @_;
167 open my $src, '<', $file or die "$file open for reading failed: $!";
168 my $dst = lock_file
($file);
171 my $result = $fn->($_);
172 push(@results, $result) if $result;
175 close $dst or die "$file(l) close failed: $!";
178 unlock_file
($file, 1);
183 my ($file, $fn) = @_;
186 open my $src, '<', $file or die "$file open for reading failed: $!";
189 my $result = $fn->($_);
190 push(@results, $result) if $result;
200 defined($email) or $email = '';
201 return $email =~ /^[a-zA-Z0-9+._-]+@[a-zA-Z0-9.-]+$/;
204 sub clean_email_multi
{
206 defined($input) or $input = '';
207 $input =~ s/^\s+//; $input =~ s/\s+$//;
210 foreach (split(/\s*,\s*/, $input)) {
212 $seen{lc($_)} = 1, push(@newlist, $_) unless $seen{lc($_)};
214 return join(",", @newlist);
# Validate a comma-separated list of email addresses.
# The single argument is first normalized by clean_email_multi and then
# split on commas; the loop returns 0 as soon as one entry fails valid_email.
217 sub valid_email_multi
{
218 # each email address must be a valid_email but we silently
219 # ignore extra spaces at the beginning/end and around any comma(s)
220 foreach (split(/,/, clean_email_multi
(shift))) {
# first invalid address rejects the whole list
221 return 0 unless valid_email
($_);
228 defined($url) or $url = '';
230 /^https?:\/\
/[a-zA-Z0-9.:-]+(\/[_\
%a-zA
-Z0
-9.\
/~:?&=;-]*)?(#[a-zA-Z0-9._-]+)?$/;
234 my $url = shift || '';
235 # Currently neither username nor password is allowed in the URL and IPv6
236 # literal addresses are not accepted either.
237 $Girocco::Config
::mirror_svn
&&
238 $url =~ /^svn(\+https?)?:\/\
/[a-zA-Z0-9.:-]+(\/[_\
%a-zA
-Z0
-9.\
/~-]*)?$/os
240 $Girocco::Config
::mirror_darcs
&&
241 $url =~ /^darcs:\/\
/[a-zA-Z0-9.:-]+(\/[_\
%a-zA
-Z0
-9.\
/~-]*)?$/os
243 $Girocco::Config
::mirror_bzr
&&
244 $url =~ /^bzr:\/\
/[a-zA-Z0-9.:-]+(\/[_\
%a-zA
-Z0
-9.\
/~-]*)?$/os
246 $Girocco::Config
::mirror_hg
&&
247 $url =~ /^hg\+https?:\/\
/[a-zA-Z0-9.:-]+(\/[_\
%a-zA
-Z0
-9.\
/~-]*)?$/os
249 return $url =~ /^(https?|git):\/\
/[a-zA-Z0-9.:-]+(\/[_\
%a-zA
-Z0
-9.\
/~-]*)?$/;
252 sub extract_url_hostname
{
253 my $url = shift || '';
254 if ($url =~ m
,^bzr
://,) {
256 return 'launchpad.net' if $url =~ /^lp:/;
258 return undef unless $url =~ m
,^[A
-Za
-z0
-9+.-]+://[^/],;
259 $url =~ s
,^[A
-Za
-z0
-9+.-]+://,,;
260 $url =~ s
,^([^/]+).*$,$1,;
261 $url =~ s/:[0-9]*$//;
262 $url =~ s/^[^\@]*[\@]//;
263 return $url ?
$url : undef;
267 # RFC 1034 section 3.5
268 # RFC 1123 section 2.1
269 # RFC 1738 section 3.1
270 # RFC 2606 sections 2 & 3
271 # RFC 3986 section 3.2.2
272 sub is_dns_hostname
{
274 defined($host) or $host = '';
275 return 0 if $host eq '' || $host =~ /\s/;
276 # first remove a trailing '.'
278 return 0 if length($host) > 255;
279 my $octet = '(?:\d|[1-9]\d|1\d{2}|2[0-4]\d|25[0-5])';
280 return 0 if $host =~ /^$octet\.$octet\.$octet\.$octet$/o;
281 my @labels = split(/[.]/, $host, -1);
282 return 0 unless @labels && @labels >= $Girocco::Config
::min_dns_labels
;
283 # now check each label
284 foreach my $label (@labels) {
285 return 0 unless length($label) > 0 && length($label) <= 63;
286 return 0 unless $label =~ /^[A-Za-z0-9](?:[A-Za-z0-9-]*[A-Za-z0-9])?$/;
288 # disallow RFC 2606 names provided at least two labels are present
290 my $tld = lc($labels[-1]);
296 my $sld = lc($labels[-2]);
297 return 0 if $sld eq 'example' &&
298 ($tld eq 'com' || $tld eq 'net' || $tld eq 'org');
303 sub is_our_hostname
{
304 my $test = shift || '';
308 $Girocco::Config
::gitweburl
,
309 $Girocco::Config
::gitwebfiles
,
310 $Girocco::Config
::webadmurl
,
311 $Girocco::Config
::bundlesurl
,
312 $Girocco::Config
::htmlurl
,
313 $Girocco::Config
::httppullurl
,
314 $Girocco::Config
::httpbundleurl
,
315 $Girocco::Config
::httpspushurl
,
316 $Girocco::Config
::gitpullurl
,
317 $Girocco::Config
::pushurl
319 foreach my $url (@urls) {
321 my $host = extract_url_hostname
($url);
322 if (defined($host)) {
324 $names{lc($host)} = 1;
328 return $names{lc($test)} ?
1 : 0;
331 my (%_oktags, %_badtags, %_canontags, $_canontagscreated, @_whitetags);
333 # These are always okay (a "whitelist") even if they would
334 # otherwise not be allowed
336 .net 2d 3d 6502 68000 68008 68010 68020 68030 68040 68060
337 8086 80286 80386 80486 80586 c cc make www x
339 map({$_oktags{lc($_)}=1} @_whitetags, @Girocco::Config
::allowed_tags
);
340 # entries MUST be all lowercase to be effective
342 # These are "nonsense" or pointless tags
343 about
=>1, after
=>1, all
=>1, also
=>1, an
=>1, and=>1, another
=>1, any
=>1,
344 are
=>1, as
=>1, at
=>1, be
=>1, because
=>1, been
=>1, before
=>1, being
=>1,
345 between
=>1, both
=>1, but
=>1, by
=>1, came
=>1, can
=>1, come
=>1, could
=>1,
346 did
=>1, do=>1, each=>1, for=>1, from
=>1, get
=>1, got
=>1, had
=>1, has
=>1,
347 have
=>1, he
=>1, her
=>1, here
=>1, him
=>1, himself
=>1, his
=>1, how
=>1,
348 if=>1, in=>1, into
=>1, is
=>1, it
=>1, like
=>1, make
=>1, many
=>1, me
=>1,
349 might
=>1, more
=>1, most
=>1, much
=>1, must
=>1, my=>1, never
=>1, now
=>1,
350 of
=>1, oh
=>1, on
=>1, only
=>1, or=>1, other
=>1, our=>1, out
=>1, over
=>1,
351 said
=>1, same
=>1, see
=>1, should
=>1, since
=>1, some
=>1, still
=>1,
352 such
=>1, take
=>1, than
=>1, that
=>1, the
=>1, their
=>1, them
=>1, then
=>1,
353 there
=>1, these
=>1, they
=>1, this
=>1, those
=>1, through
=>1, to
=>1,
354 too
=>1, under
=>1, up
=>1, very
=>1, was
=>1, way
=>1, we
=>1, well
=>1,
355 were
=>1, what
=>1, where
=>1, which
=>1, while=>1, who
=>1, with
=>1,
356 would
=>1, yea
=>1, yeah
=>1, you
=>1, your
=>1, yup
=>1
358 # These are "offensive" tags with at least one letter escaped to
359 # avoid having this file trigger various safe-scan robots
360 $_badtags{"a\x73\x73"} = 1;
361 $_badtags{"a\x73\x73hole"} = 1;
362 $_badtags{"b\x30\x30b"} = 1;
363 $_badtags{"b\x30\x30bs"} = 1;
364 $_badtags{"b\x6f\x6fb"} = 1;
365 $_badtags{"b\x6f\x6fbs"} = 1;
366 $_badtags{"b\x75tt"} = 1;
367 $_badtags{"b\x75ttd\x69\x63k"} = 1;
368 $_badtags{"c\x6f\x63k"} = 1;
369 $_badtags{"c\x75\x6e\x74"} = 1;
370 $_badtags{"d\x69\x63k"} = 1;
371 $_badtags{"d\x69\x63kb\x75tt"} = 1;
372 $_badtags{"f\x75\x63k"} = 1;
373 $_badtags{"in\x63\x65st"} = 1;
374 $_badtags{"ph\x75\x63k"} = 1;
375 $_badtags{"p\x6f\x72n"} = 1;
376 $_badtags{"p\x6f\x72no"} = 1;
377 $_badtags{"p\x6f\x72nographic"} = 1;
378 $_badtags{"p\x72\x30n"} = 1;
379 $_badtags{"p\x72\x6fn"} = 1;
380 $_badtags{"r\x61\x70e"} = 1;
381 $_badtags{"s\x65\x78"} = 1;
382 map({$_badtags{lc($_)}=1} @Girocco::Config
::blocked_tags
);
385 # A valid tag must only have [a-zA-Z0-9:.+#_-] characters, must start with a
386 # letter, must not be a noise word, must be more than one character long,
387 # must not be a repeated letter and must be no more than 32 characters long.
388 # However, anything in %_oktags is explicitly allowed even if it otherwise
389 # would violate the rules (except that none of [,\s\\\/] are allowed in tags).
390 # Returns the canonical name for the tag if the tag is valid otherwise undef.
393 return undef unless defined($_) && $_ ne "" && !/[,\s\/\\]/;
394 my $fold = $Girocco::Config
::foldtags
;
395 if ($fold && !$_canontagscreated) {
398 $_canontags{lc($_)} = $_ foreach sort({$b cmp $a} @_whitetags, @Girocco::Config
::allowed_tags
);
399 $_canontagscreated = 1;
401 return $_canontags{lc($_)} if $fold && exists($_canontags{lc($_)});
402 return ($fold ?
lc($_) : $_) if $_oktags{lc($_)};
403 return undef unless /^[a-zA-Z][a-zA-Z0-9:.+#_-]+$/;
404 return undef if $_badtags{lc($_)};
405 return undef if /^(.)\1+$/;
406 return length($_) <= 32 ?
($fold ?
lc($_) : $_) : undef;
409 # If the passed in argument looks like a URL, return only the stuff up through
410 # the host:port part otherwise return the entire argument.
412 my $url = shift || '';
414 $url = $1.$2.$3.$4 if $url =~ m
,^( [A
-Za
-z
][A
-Za
-z0
-9+.-]*: ) # scheme
415 ( // ) # // separator
416 ((?
:[^\@
]+\@
)?
) # optional userinfo
417 ( [^/?
#]+ ) # host and port
418 (?
:[/?#].*)?$,x; # path and optional query string and/or anchor
422 # If the passed in argument looks like a URL, return only the stuff following
423 # the host:port part otherwise return the entire argument.
424 # If the optional second argument is true, the returned value will have '/'
425 # appended if it does not already end in '/'.
427 my $url = shift || '';
428 my $add_slash = shift || 0;
430 $url = $1 if $url =~ m
,^(?
: [A
-Za
-z
][A
-Za
-z0
-9+.-]*: ) # scheme
431 (?
: // ) # // separator
432 (?
: [^\@
]+\@
)?
# optional userinfo
433 (?
: [^/?
#]+ ) # host and port
434 ((?
:[/?#].*)?)$,x; # path and optional query string and/or anchor
435 $url .= '/' if $add_slash && $url !~ m
|/$|;
439 # If both SERVER_NAME and SERVER_PORT are set pass the argument through url_path
440 # and then prefix it with the appropriate scheme (HTTPS=?on), host and port and
441 # return it. If something that doesn't look like it could be the start of a
442 # URL path comes back from url_path or SERVER_NAME is a link-local IPv6 address
443 # then just return the argument unchanged.
445 my $url = shift || '';
446 my $path = url_path
($url);
447 return $url unless $path eq '' || $path =~ m
|^[/?
#]|;
448 return $url unless $ENV{'SERVER_NAME'} && $ENV{'SERVER_PORT'} &&
449 $ENV{'SERVER_PORT'} =~ /^[1-9][0-9]{0,4}$/;
450 return $url if $ENV{'SERVER_NAME'} =~ /^[[]?fe80:/i;
451 my $server = $ENV{'SERVER_NAME'};
452 # Deal with Apache bug where IPv6 literal server names do not include
453 # the required surrounding '[' and ']' characters
454 $server = '[' . $server . ']' if $server =~ /:/ && $server !~ /^[[]/;
455 my $ishttps = $ENV{'HTTPS'} && $ENV{'HTTPS'} =~ /^on$/i;
456 my $portnum = 0 + $ENV{'SERVER_PORT'};
458 if (($ishttps && $portnum != 443) || (!$ishttps && $portnum != 80)) {
459 $port = ':' . $portnum;
461 return 'http' . ($ishttps ?
's' : '') . '://' . $server . $port . $path;
464 # Returns the number rounded to the nearest tenth. The ".d" part will be
465 # excluded if it's ".0" unless the optional second argument is true
472 return '' . int($v/10) unless $v % 10 || $use0;
473 return '' . int($v/10) . '.' . ($v%10);
476 # Returns a human-readable size string (e.g. '1.5 MiB') for the value
477 # (in bytes) passed in. Returns '0' for undefined or 0 or not all digits.
478 # Otherwise returns '1 KiB' for <= 1024, or else a number rounded to the
479 # nearest tenth of a KiB, MiB or GiB.
482 return "0" unless $v && $v =~ /^\d+$/;
483 return "1 KiB" unless $v > 1024;
485 return _tenths
($v) . " KiB" if $v < 1024;
487 return _tenths
($v) . " MiB" if $v < 1024;
489 return _tenths
($v) . " GiB";
# Escape the four HTML-significant characters in $str.
# The ampersand is handled first so the entities produced by the later
# substitutions are not escaped a second time.
# Each entity's leading '&' is written as \x26 so the replacement text stays
# intact if this file is ever run through HTML-aware tooling that collapses
# character references (which would turn the substitution into a no-op).
$str =~ s/&/\x26amp;/g;
$str =~ s/</\x26lt;/g;
$str =~ s/>/\x26gt;/g;
$str =~ s/"/\x26quot;/g; #"
501 # create relative time string from passed in age in seconds
506 if ($age > 60*60*24*365*2) {
507 $age_str = (int $age/60/60/24/365);
508 $age_str .= " years ago";
509 } elsif ($age > 60*60*24*(365/12)*2) {
510 $age_str = int $age/60/60/24/(365/12);
511 $age_str .= " months ago";
512 } elsif ($age > 60*60*24*7*2) {
513 $age_str = int $age/60/60/24/7;
514 $age_str .= " weeks ago";
515 } elsif ($age > 60*60*24*2) {
516 $age_str = int $age/60/60/24;
517 $age_str .= " days ago";
518 } elsif ($age > 60*60*2) {
519 $age_str = int $age/60/60;
520 $age_str .= " hours ago";
521 } elsif ($age > 60*2) {
522 $age_str = int $age/60;
523 $age_str .= " mins ago";
526 $age_str .= " secs ago";
527 } elsif ($age >= 0) {
528 $age_str = "right now";
530 $age_str = "future time";
535 # create relative time string from passed in idle in seconds
537 my $idle_str = _rel_age
(shift);
538 $idle_str =~ s/ ago//;
539 $idle_str = "not at all" if $idle_str eq "right now";
544 use POSIX
qw(strftime);
545 my ($fmt, $secs, $zonesecs) = @_;
546 my ($S,$M,$H,$d,$m,$y) = gmtime($secs + $zonesecs);
547 $zonesecs = int($zonesecs / 60);
549 my $ans = strftime
($fmt, $S, $M, $H, $d, $m, $y, -1, -1, -1);
553 $zonesecs = -$zonesecs;
557 $z .= sprintf("%02d%02d", int($zonesecs/60), $zonesecs % 60);
562 # Take a list of project names and produce a nicely formatted table that
563 # includes owner links and descriptions. If the list is empty returns ''.
564 # The first argument may be a hash ref that contains options. The following
565 # options are available:
566 # target -- sets the target value of the owner link
567 # emptyok -- if true returns an empty table rather than ''
568 # sizecol -- if true include a human-readable size column
569 # typecol -- if true include type column with hover info
570 # changed -- if true include a changed and idle column
571 sub projects_html_list
{
573 if (defined($_[0]) && ref($_[0]) eq 'HASH') {
576 return '' unless @_ || (defined($options->{emptyok
}) && $options->{emptyok
});
577 require Girocco
::Project
;
580 $target = " target=\""._escapeHTML
($options->{target
})."\""
581 if defined($options->{target
});
582 my $withsize = defined($options->{sizecol
}) && $options->{sizecol
};
583 my $withtype = defined($options->{typecol
}) && $options->{typecol
};
584 my $withchanged = defined($options->{changed
}) && $options->{changed
};
586 $sizehead = substr(<<EOT, 0, -1) if $withsize;
587 <th class="sizecol"><span class="hover">Size<span><span class="head">Size</span
588 />Fork size excludes objects borrowed from the parent.</span></span></th
592 $typehead = '<th>Type</th>' if $withtype;
594 $chghead = substr(<<EOT, 0, -1) if $withchanged;
595 <th><span class="hover">Changed<span><span class="head">Changed</span
596 />The last time a ref change was received by this site.</span></span></th
597 ><th><span class="hover">Idle<span><span class="head">Idle</span
598 />The most recent committer time in <i>refs/heads</i>.</span></span></th
602 <table class='projectlist'><tr><th>Project</th>$sizehead$typehead$chghead<th class="desc">Description</th></tr>
604 my $trclass = ' class="odd"';
605 foreach (sort({lc($a) cmp lc($b)} @_)) {
606 if (Girocco
::Project
::does_exist
($_, 1)) {
607 my $proj = Girocco
::Project
->load($_);
608 my $projname = $proj->{name
}.".git";
609 my $projdesc = $proj->{desc
}||'';
610 utf8
::decode
($projdesc) if utf8
::valid
($projdesc);
613 my $psize = $proj->{reposizek
};
614 $psize = undef unless defined($psize) && $psize =~ /^\d+$/;
615 $psize = 0 if !defined($psize) && $proj->is_empty;
616 if (!defined($psize)) {
621 $psize = human_size
($psize * 1024);
622 $psize =~ s/ /\ /g;
624 $sizecol = '<td class="sizecol">'.$psize.'</td>';
628 if ($proj->{mirror
}) {
629 $typecol = substr(<<EOT, 0, -1);
630 <td class="type"><span class="hover">mirror<span class="nowrap">@{[_escapeHTML($proj->{url})]}</span></span></td>
633 my $users = @
{$proj->{users
}};
635 $users .= 's' unless @
{$proj->{users
}} == 1;
636 my $userlist = join(', ', sort({lc($a) cmp lc($b)} @
{$proj->{users
}}));
637 my $spncls = length($userlist) > 25 ?
'' : ' class="nowrap"';
638 $typecol = $userlist ?
substr(<<EOT, 0, -1) : substr(<<EOT, 0, -1);
639 <td
class="type"><span
class="hover">$users<span
$spncls>$userlist</span></span
></td
>
641 <td
class="type">$users</td
>
648 my $changetime = $proj->{lastchange
};
650 $rel = "<span class=\"hover\">" .
651 _rel_age
(time - parse_rfc2822_date
($changetime)) .
652 "<span class=\"nowrap\">$changetime</span></span>";
656 $changecol = substr(<<EOT, 0, -1);
657 <td class="change">$rel</td>
659 my $idletime = $proj->{lastactivity
};
661 $idlesecs = parse_any_date
($idletime, \
$tz) if $idletime;
663 my $idle2822 = _strftime
("%a, %d %b %Y %T %z", $idlesecs, $tz);
664 $rel = "<span class=\"hover\">" .
665 _rel_idle
(time - $idlesecs) .
666 "<span class=\"nowrap\">$idle2822</span></span>";
670 $changecol .= substr(<<EOT, 0, -1);
671 <td class="idle">$rel</td>
675 <tr$trclass><td><a href="@{[url_path($Girocco::Config::gitweburl)]}/$projname"$target
676 >@{[_escapeHTML($projname)]}</td>$sizecol$typecol$changecol<td>@{[_escapeHTML($projdesc)]}</td></tr>
678 $trclass = $trclass ?
'' : ' class="odd"';
685 return ($count || (defined($options->{emptyok
}) && $options->{emptyok
})) ?
$html : '';
691 jan
=> 0, feb
=> 1, mar
=> 2, apr
=> 3, may
=> 4, jun
=> 5,
692 jul
=> 6, aug
=> 7, sep
=> 8, oct => 9, nov
=> 10, dec
=> 11
696 # Should be in "date '+%a, %d %b %Y %T %z'" format as saved to lastgc, lastrefresh and lastchange
697 # The leading "%a, " is optional, returns undef if unrecognized date. This is also known as
698 # RFC 2822 date format and git's '%cD', '%aD' and --date=rfc2822 format.
699 # If the second argument is a SCALAR ref, its value will be set to the TZ offset in seconds
# Parse an RFC 2822 style date ("[%a, ]%d %b %Y %T %z") into epoch seconds.
#
# Arguments:
#   $_[0]  the date string; the leading "day-of-week, " part is optional
#   $_[1]  optional SCALAR ref; on success it is set to the zone offset in
#          seconds (positive for zones written with a leading '+')
#
# Returns the number of seconds since the epoch (UTC), or undef when the
# string does not have the expected layout, names an unknown month, has a
# year before 1000, or contains a field that timegm rejects (for example
# day 32 or second 60).
sub parse_rfc2822_date {
    my $dstr = shift || '';
    my $tzoff = shift || '';
    # strip an optional leading "Day, " prefix
    $dstr = $1 if $dstr =~ /^[^\s]+,\s*(.*)$/;
    return undef unless $dstr =~
        /^\s*(\d{1,2})\s+([A-Za-z]{3})\s+(\d{4})\s+(\d{1,2}):(\d{2}):(\d{2})\s+([+-]\d{4})\s*$/;
    my ($d,$b,$Y,$H,$M,$S,$z) = ($1,$2,$3,$4,$5,$6,$7);
    my $m = $_month_names{lc($b)};
    return undef unless defined($m);
    # Time::Local only treats a year as the literal calendar year when it is
    # greater than 999; smaller values are taken as offsets from 1900 or as
    # two-digit shorthand. Pass the four-digit year unchanged (not $Y-1900,
    # which turns 1900-1999 into two-digit shorthand) and refuse years that
    # cannot be expressed unambiguously.
    return undef if $Y < 1000;
    # timegm croaks on out-of-range fields; report those as an unrecognized
    # date instead of letting the exception escape.
    my $seconds = do {
        local $@;
        eval { timegm(0+$S, 0+$M, 0+$H, 0+$d, 0+$m, 0+$Y) };
    };
    return undef unless defined($seconds);
    # zone is [+-]HHMM; convert to signed seconds
    my $offset = 60 * (60 * (0+substr($z,1,2)) + (0+substr($z,3,2)));
    $offset = -$offset if substr($z,0,1) eq '-';
    $$tzoff = $offset if ref($tzoff) eq 'SCALAR';
    # the fields were local to the zone, so subtract the offset to get UTC
    return $seconds - $offset;
}
716 # Will parse any supported date format. Actually there are four formats
717 # currently supported:
718 # 1. RFC 2822 (uses parse_rfc2822_date)
719 # 2. RFC 3339 / ISO 8601 (T may be ' ' or '_', 'Z' is optional or may be 'UTC', ':' optional in TZ)
720 # 3. Same as #2 except no colons or hyphens allowed and hours MUST be 2 digits
721 # 4. unix seconds since epoch with optional +/- trailing TZ (may not have a ':')
722 # Returns undef if unsupported date.
723 # If the second argument is a SCALAR ref, its value will be set to the TZ offset in seconds
725 my $dstr = shift || '';
726 my $tzoff = shift || '';
727 if ($dstr =~ /^\s*([-+]?\d+)(?:\s+([-+]\d{4}))?\s*$/) {
733 $off = 60 * (60 * (0+substr($z,1,2)) + (0+substr($z,3,2)));
734 $off = -$off if substr($z,0,1) eq '-';
736 $$tzoff = $off if ref($tzoff) eq 'SCALAR';
739 if ($dstr =~ /^\s*(\d{4})-(\d{2})-(\d{2})[Tt _](\d{1,2}):(\d{2}):(\d{2})(?:[ _]?([Zz]|[Uu][Tt][Cc]|(?:[-+]\d{1,2}:?\d{2})))?\s*$/ ||
740 $dstr =~ /^\s*(\d{4})(\d{2})(\d{2})[Tt _](\d{2})(\d{2})(\d{2})(?:[ _]?([Zz]|[Uu][Tt][Cc]|(?:[-+]\d{2}\d{2})))?\s*$/) {
741 my ($Y,$m,$d,$H,$M,$S,$z) = ($1,$2,$3,$4,$5,$6,$7||'');
742 my $seconds = timegm
(0+$S, 0+$M, 0+$H, 0+$d, $m-1, $Y-1900);
743 defined($z) && $z ne '' or $z = 'Z';
746 substr($z,1,0) = '0' if length($z) == 4;
748 if ($z ne 'Z' && $z ne 'UTC') {
749 $off = 60 * (60 * (0+substr($z,1,2)) + (0+substr($z,3,2)));
750 $off = -$off if substr($z,0,1) eq '-';
752 $$tzoff = $off if ref($tzoff) eq 'SCALAR';
753 return $seconds - $off;
755 return parse_rfc2822_date
($dstr, $tzoff);
758 # Input is a number such as a minute interval
759 # Return value is a random number between the input and 1.25*input
760 # This can be used to randomize the update and gc operations a bit to avoid
761 # having them all end up all clustered together
763 my $input = shift || 0;
764 return $input unless $input;
765 return $input + int(rand(0.25 * $input));
768 # Open a pipe to a new sendmail process. The '-i' option is always passed to
769 # the new process followed by any additional arguments passed in. Note that
770 # the sendmail process is only expected to understand the '-i', '-t' and '-f'
771 # options. Using any other options via this function is not guaranteed to work.
772 # A list of recipients may follow the options. Combining a list of recipients
773 # with the '-t' option is not recommended.
775 return undef unless @_;
776 die "\$Girocco::Config::sendmail_bin is unset or not executable!\n"
777 unless $Girocco::Config
::sendmail_bin
&& -x
$Girocco::Config
::sendmail_bin
;
778 my $result = open(my $pipe, '|-', $Girocco::Config
::sendmail_bin
, '-i', @_);
779 return $result ?
$pipe : undef;
782 # Open a pipe that works similarly to a mailer such as /usr/bin/mail in that
783 # if the first argument is '-s', a subject line will be automatically added
784 # (using the second argument as the subject). Any remaining arguments are
785 # expected to be recipient addresses that will be added to an explicit To:
786 # line as well as passed on to sendmail_pipe. In addition an
787 # "Auto-Submitted: auto-generated" header is always added as well as a suitable
791 if (@_ >= 2 && $_[0] eq '-s') {
795 my $tolist = join(", ", @_);
796 unshift(@_, '-f', $Girocco::Config
::sender
) if $Girocco::Config
::sender
;
797 my $pipe = sendmail_pipe
(@_);
799 print $pipe "From: \"$Girocco::Config::name\" ",
800 "($Girocco::Config::title) ",
801 "<$Girocco::Config::admin>\n";
802 print $pipe "To: $tolist\n";
803 print $pipe "Subject: $subject\n" if defined($subject);
804 print $pipe "MIME-Version: 1.0\n";
805 print $pipe "Content-Type: text/plain; charset=utf-8\n";
806 print $pipe "Content-Transfer-Encoding: 8bit\n";
807 print $pipe "X-Girocco: $Girocco::Config::gitweburl\n"
808 unless $Girocco::Config
::suppress_x_girocco
;
809 print $pipe "Auto-Submitted: auto-generated\n";
817 return undef unless defined($val);
818 $val =~ s/[\r\n]+$//s;
819 return undef unless $val =~ /^\d+$/;
821 return undef unless $val >= 1;
825 # Returns the number of "online" cpus or undef if undetermined
827 my @confcpus = $^O
eq "linux" ?
828 qw(_NPROCESSORS_ONLN NPROCESSORS_ONLN) :
829 qw(NPROCESSORS_ONLN _NPROCESSORS_ONLN) ;
830 my $cpus = _goodval
(get_cmd
('getconf', $confcpus[0]));
831 return $cpus if $cpus;
832 $cpus = _goodval
(get_cmd
('getconf', $confcpus[1]));
833 return $cpus if $cpus;
834 if ($^O
ne "linux") {
835 my @sysctls = qw(hw.ncpu);
836 unshift(@sysctls, qw(hw.availcpu)) if $^O
eq "darwin";
837 foreach my $mib (@sysctls) {
838 $cpus = _goodval
(get_cmd
('sysctl', '-n', $mib));
839 return $cpus if $cpus;
845 # Returns the system page size in bytes or undef if undetermined
846 # This should never fail on a POSIX system
848 use POSIX
":unistd_h";
849 my $pagesize = sysconf
(_SC_PAGESIZE
);
850 return undef unless defined($pagesize) && $pagesize =~ /^\d+$/;
851 $pagesize = 0 + $pagesize;
852 return undef unless $pagesize >= 256;
856 # Returns the amount of available physical memory in bytes
857 # This may differ from the actual amount of physical memory installed
858 # Returns undef if this cannot be determined
860 my $pagesize = sys_pagesize
;
861 if ($pagesize && $^O
eq "linux") {
862 my $pages = _goodval
(get_cmd
('getconf', '_PHYS_PAGES'));
863 return $pagesize * $pages if $pages;
865 if ($^O
ne "linux") {
866 my @sysctls = qw(hw.physmem64);
867 unshift(@sysctls, qw(hw.memsize)) if $^O
eq "darwin";
868 foreach my $mib (@sysctls) {
869 my $memsize = _goodval
(get_cmd
('sysctl', '-n', $mib));
870 return $memsize if $memsize;
872 my $memsize32 = _goodval
(get_cmd
('sysctl', '-n', 'hw.physmem'));
873 return $memsize32 if $memsize32 && $memsize32 <= 2147483647;
875 my $pages = _goodval
(get_cmd
('sysctl', '-n', 'hw.availpages'));
876 return $pagesize * $pages if $pages;
878 return 2147483647 + 1 if $memsize32;
883 sub _get_max_conf_suffixed_size
{
885 return undef unless defined $conf && $conf =~ /^(\d+)([kKmMgG]?)$/;
886 my ($val, $suffix) = (0+$1, lc($2));
887 $val *= 1024 if $suffix eq 'k';
888 $val *= 1024 * 1024 if $suffix eq 'm';
889 $val *= 1024 * 1024 * 1024 if $suffix eq 'g';
893 sub _make_suffixed_size
{
895 return $size if $size % 1024;
897 return "${size}k" if $size % 1024;
899 return "${size}m" if $size % 1024;
904 # Return the value to pass to --window-memory= for git repack
905 # If the system memory or number of CPUs cannot be determined, returns "1g"
906 # Otherwise returns one third the available memory divided by the number of CPUs
907 # but never more than 1 gigabyte or max_gc_window_memory_size.
# Compute the value to hand to "git repack --window-memory=".
# Starts from a 1 GiB ceiling. When both the online CPU count and the memory
# size are known, the figure becomes a third of memory divided by the CPU
# count, still limited to 1 GiB. A non-zero configured
# max_gc_window_memory_size lowers the result further when it is smaller.
# The final number is returned via _make_suffixed_size.
sub calc_windowmemory {
    my $one_gib = 1024 * 1024 * 1024;
    my $ncpu = online_cpus();
    my $ram = sys_memsize();
    my $limit = $one_gib;
    if ($ncpu && $ram) {
        my $share = int($ram / 3 / $ncpu);
        $limit = $share < $one_gib ? $share : $one_gib;
    }
    my $cap = _get_max_conf_suffixed_size($Girocco::Config::max_gc_window_memory_size);
    # an undefined or zero cap means "no configured limit"
    $limit = $cap if $cap && $limit > $cap;
    return _make_suffixed_size($limit);
}
921 # Return the value to set as core.bigFileThreshold for git repack
922 # If the system memory cannot be determined, returns "256m"
923 # Otherwise returns the available memory divided by 16
924 # but never more than 512 megabytes or max_gc_big_file_threshold_size.
# Takes no arguments; the result is whatever _make_suffixed_size returns
# for the computed byte count.
925 sub calc_bigfilethreshold
{
926 my $memsize = sys_memsize
;
# starting value: 256 MiB
927 my $max = 256 * 1024 * 1024;
# NOTE(review): the header comment says the 256 MiB default is kept when the
# memory size is unknown, so the next two statements are presumably guarded
# by a test on $memsize that is not visible here -- confirm.
# one sixteenth of the memory size ...
929 $max = int($memsize / 16);
# ... but never more than 512 MiB
930 $max = 512 * 1024 * 1024 if $max >= 512 * 1024 * 1024;
932 my $maxconf = _get_max_conf_suffixed_size
($Girocco::Config
::max_gc_big_file_threshold_size
);
# a defined, non-zero configured maximum lowers the value when it is smaller
933 $max = $maxconf if defined($maxconf) && $maxconf && $max > $maxconf;
934 return _make_suffixed_size
($max);
937 # Return the value to use when deciding whether or not to re-calculate object deltas
938 # If there are no more than this many objects then deltas will be recomputed in
939 # order to create more efficient pack files. The new_delta_threshold value
940 # is constrained to be at least 1000 * cpu cores and no more than 100000.
941 # The default is sys_memsize rounded up to the nearest multiple of 256 MB and
942 # then 5000 per 256 MB or 50000 if we cannot determine memory size but never
943 # more than 100000 or less than 1000 * cpu cores.
944 sub calc_redeltathreshold
{
945 my $cpus = online_cpus
|| 1;
946 if (defined($Girocco::Config
::new_delta_threshold
) &&
947 $Girocco::Config
::new_delta_threshold
=~ /^\d+/) {
948 my $ndt = 0 + $Girocco::Config
::new_delta_threshold
;
949 if ($ndt >= $cpus * 1000) {
950 return $ndt <= 100000 ?
$ndt : 100000;
954 my $memsize = sys_memsize
;
956 my $quantum = 256 * 1024 * 1024;
957 $calcval = 5000 * int(($memsize + ($quantum - 1)) / $quantum);
958 $calcval = 1000 * $cpus if $calcval < 1000 * $cpus;
959 $calcval = 100000 if $calcval > 100000;
964 # $1 => thing to test
965 # $2 => optional directory, if given and -e "$2/$1$3", then return false
966 # $3 => optional, defaults to ''
# Arguments are read positionally into $name, $dir and $ext; every visible
# return below is the "not reserved" (0) outcome.
967 sub has_reserved_suffix
{
968 no warnings
; # avoid silly 'unsuccessful stat on filename with \n' warning
969 my ($name, $dir, $ext) = @_;
970 $ext = '' unless defined $ext;
# a name without a ".suffix" part cannot carry a reserved suffix
971 return 0 unless defined $name && $name =~ /\.([^.]+)$/;
# the lowercased suffix must be a key of %Girocco::Config::reserved_suffixes
972 return 0 unless exists $Girocco::Config
::reserved_suffixes
{lc($1)};
# when a directory is given, an existing "$dir/$name$ext" overrides the match
973 return 0 if defined $dir && -e
"$dir/$name$ext";
977 # mostly undoes effect of `use CGI::Carp qw(fatalsToBrowser);`
978 # mostly undoes effect of `use CGI::Carp qw(warningsToBrowser);`
979 sub noFatalsToBrowser
{
980 delete $SIG{__DIE__
};
981 delete $SIG{__WARN__
};
982 undef *CORE
::GLOBAL
::die;
983 *CORE
::GLOBAL
::die = sub {
985 my $ec = $! || ($?
>> 8) || 255;
986 my (undef, $fn, $li) = caller(0);
987 my $loc = " at " . $fn . " line " . $li . ".\n";
989 $msg = join("", @_) if @_;
990 $msg = "Died" if $msg eq "";
991 $msg .= $loc unless $msg =~ /\n$/;
993 printf STDERR
"%s", $msg;
996 undef *CORE
::GLOBAL
::warn;
997 *CORE
::GLOBAL
::warn = sub {
999 my (undef, $fn, $li) = caller(0);
1000 my $loc = " at " . $fn . " line " . $li . ".\n";
1002 $msg = join("", @_) if @_;
1003 $msg = "Warning: something's wrong" if $msg eq "";
1004 $msg .= $loc unless $msg =~ /\n$/;
1005 printf STDERR
"%s", $msg;
1009 # mimics Git's symref reading but only for HEAD
1010 # returns undef on failure or if HEAD is not a symbolic ref
1011 sub read_HEAD_symref
{
1012 my $headpath = $_[0] . "/HEAD";
1014 my $rl = readlink($headpath);
1015 return defined($rl) && $rl =~ m
,^refs
/., ?
$rl : undef;
1017 open my $fd, '<', $headpath or return undef;
1024 defined($hv) or return undef;
1026 return $hv =~ m
,^ref:\s
*(refs
/.+)$, ?
$1 : undef;
1039 $_[0] =~ s/\\([btn\042\\])/$escvals{$1}/g;
1044 # mimics Git's config.c git_parse_source function behavior
1045 # returns array of arrayref of key and value
1046 # except that valueless booleans have a value of undef
1047 sub read_config_file
{
1049 my ($fn, $warn) = @_;
1053 open my $fh, '<', $fn or
1054 $warn && warn("could not open \"$fn\": $!\n"), return(undef);
1058 warn "bad config line $li in file $fn\n" if $warn;
1065 s/^\x{feff}// if $li == 1;
1067 if (/^\s*\[(.*)$/) {
1069 if ($l =~ /^([.a-zA-Z0-9-]+)\](.*)$/) {
1070 $section = lc($1) . ".";
1072 } elsif ($l =~ /^([.a-zA-Z0-9-]*)\s+"((?:[^\042\\\n]|\\.)*)"\](.*)$/) {
1073 $section = lc($1) . "." .
1074 &{sub{my $x=shift; $x =~ s/\\(.)/$1/g; $x}}($2) . ".";
1080 next if /^\s*(?:[;#]|$)/;
1082 if (/^([a-zA-Z][a-zA-Z0-9-]*)[ \t]*(.*)$/) {
1083 my $k = $section . lc($1);
1087 } elsif ($v =~ /^=\s*(.*)$/) {
1096 if (!$qt && $pd =~ /^((?:[^"\\\n;#]|\\[btn"\\])+)/) {
1098 $pd = substr($pd, length($a));
1099 if ($pd =~ /^[;#]/) {
1104 $v .= &$cf_unesc($a);
1105 } elsif ($qt && $pd =~ /^((?:[^"\\\n]|\\[btn"\\])+)/) {
1107 $pd = substr($pd, length($a));
1108 $v .= &$cf_unesc($a);
1109 } elsif ($pd =~ /^\042/) {
1111 $pd = substr($pd, 1);
1112 } elsif (!$qt && $pd =~ /^[;#]/) {
1114 } elsif ($pd eq "\\") {
1118 $pd =~ s/(?:\r\n|\n)$//;
1119 $pd = to_utf8
($pd, 1);
1120 $pd =~ s/^\s+// unless $v ne "" || $qt;
1132 push(@vals, [$k, $v]);
1141 # Same as read_config_file except that a hashref is returned and
1142 # subsequent same-key-name values replace earlier ones.
1143 # Also valueless booleans are given the value 1
# All arguments are forwarded unchanged to read_config_file.
1144 sub read_config_file_hash
{
1145 my $result = read_config_file
(@_);
# pass a read_config_file failure (undef) straight back to the caller
1146 return undef unless defined($result);
# Flatten the [key, value] pairs into a hash: a later pair with the same key
# overwrites an earlier one, and an undef value is stored as 1.
1147 my %config = map {($$_[0], defined($$_[1])?
$$_[1]:1)} @
$result;
1151 # similar to Git's test except that GIT_OBJECT_DIRECTORY is ignored
1154 defined($gd) && $gd ne "" && -d
$gd or return undef;
1155 -d
"$gd/objects" && -x
"$gd/objects" or return 0;
1156 -d
"$gd/refs" && -x
"$gd/refs" or return 0;
1157 if (-l
"$gd/HEAD") {
1158 my $rl = readlink("$gd/HEAD");
1159 defined($rl) && $rl =~ m
,^refs
/., or return 0;
1160 -e
"$gd/HEAD" or return 1;
1162 open my $fd, '<', "$gd/HEAD" or return 0;
1169 defined $hv or return 0;
1171 $hv =~ m
,^ref:\s
*refs
/., and return 1;
1172 return $hv =~ /^[0-9a-f]{40}/;
1175 # Returns 0 for false, 1 for true, undef for unrecognized or undef
1176 # Unless the optional second argument is true in which case undef returns 1
1178 defined($_[0]) or return $_[1] ?
1 : undef;
1180 return 0 if $v eq 'false' || $v eq 'off' || $v eq 'no' || $v eq '' || $v =~ /^[-+]?0+$/;
1181 return 1 if $v eq 'true' || $v eq 'on' || $v eq 'yes' || $v =~ /^[-+]?0*[1-9][0-9]*$/;