git.git: update to v2.10.4
[girocco.git] / shlib.sh
blobfa4f0055bde252f1de5b1de78ba0262dcfa68633
#!/bin/sh

# This is the generic shell library for all the scripts used by Girocco;
# most importantly, it introduces all the $cfg_* shell variables.
# SHA-1 patterns: shell glob fragments matching 1, 4, 19 and 20 octets
# written as lowercase hexadecimal digits (octet20 matches a full SHA-1).
octet='[0-9a-f][0-9a-f]'
octet4="$octet$octet$octet$octet"
octet19="$octet4$octet4$octet4$octet4$octet$octet$octet"
octet20="$octet4$octet4$octet4$octet4$octet4"
# The all-zeros object name (40 hex digits)
nullsha="0000000000000000000000000000000000000000"
# A single literal tab character
tab="$(printf '\t')"

# set a sane umask that never excludes any user or group permissions
# (the current mask is kept except that the user and group bits are cleared)
umask "$(printf '0%03o' "$(( $(umask) & ~0770 ))")"
vcmp() {
	# Compare $1 to $2 each of which must match \d+(\.\d+)*
	# An empty string ('') for $1 or $2 is treated like 0
	# Outputs:
	#  -1 if $1 < $2
	#   0 if $1 = $2
	#   1 if $1 > $2
	# Note that `vcmp 1.8 1.8.0.0.0.0` correctly outputs 0.
	#
	# Each pass compares the leading dot-separated component of both
	# versions numerically and then drops it; a missing component counts
	# as 0.  The loop ends once both versions have been consumed.
	while
		_a="${1%%.*}"
		_b="${2%%.*}"
		[ -n "$_a" ] || [ -n "$_b" ]
	do
		if [ "${_a:-0}" -lt "${_b:-0}" ]; then
			printf '%s\n' "-1"
			return
		elif [ "${_a:-0}" -gt "${_b:-0}" ]; then
			printf '%s\n' "1"
			return
		fi
		# strip the component just compared plus its trailing dot
		_a2="${1#"$_a"}"
		_b2="${2#"$_b"}"
		set -- "${_a2#.}" "${_b2#.}"
	done
	printf '%s\n' "0"
}
unset orig_path
get_girocco_config_pm_var_list() (
	# Export all the variables from Girocco::Config to suitable var= lines
	# prefixing them with 'cfg_'. E.g. $cfg_admin is admin's mail address now
	# and also setting a 'defined_cfg_' prefix to 1 if they are not undef.
	#
	# The configuration module defaults to Girocco::Config and may be
	# overridden with $GIROCCO_CONF.  If $basedir is set it is added as an
	# extra Perl include directory.  The function body runs in a subshell
	# so none of the settings made here leak into the caller.
	[ -z "$orig_path" ] || { PATH="$orig_path" && export PATH; }
	# Build the include options as separate words so that a directory
	# containing whitespace is passed to perl intact.
	set -- "-I@basedir@"
	[ -z "$basedir" ] || set -- "$@" "-I$basedir"
	perl "$@" "-M${GIROCCO_CONF:-Girocco::Config}" -le \
		'foreach (sort {uc($a) cmp uc($b)} keys %Girocco::Config::) {
			my $val = ${$Girocco::Config::{$_}}; defined($val) or $val="";
			$val =~ s/([\\"\$\`])/\\$1/gos;
			$val =~ s/(?:\r\n|\r|\n)$//os;
			print "cfg_$_=\"$val\"";
			print "defined_cfg_$_=",
				(defined(${$Girocco::Config::{$_}})?"1":"");
		}'
)
# Returns full command path for "$1" if it's a valid command otherwise returns "$1"
# The result is written to standard output followed by a newline.
_fcp() {
	# command -v fails (and prints nothing) when "$1" cannot be resolved
	_fp="$(command -v "$1" 2>/dev/null)" || _fp="$1"
	printf '%s\n' "$_fp"
}
get_girocco_config_var_list() (
	# Same as get_girocco_config_pm_var_list except that
	# the following variables (all starting with var_) are added:
	# var_group		cfg_owning_group if defined otherwise `id -gn`
	# var_git_ver		The version number part from `git version`
	# var_git_exec_path	The result of $cfg_git_bin --exec-path
	# var_sh_bin		Full path to the posix sh interpreter to use
	# var_perl_bin		Full path to the perl interpreter to use
	# var_gzip_bin		Full path to the gzip executable to use
	# var_nc_openbsd_bin	Full path to the netcat (nc) with -U support
	# var_have_git_171	Set to 1 if git version >= 1.7.1 otherwise ''
	# var_have_git_172	Set to 1 if git version >= 1.7.2 otherwise ''
	# var_have_git_173	Set to 1 if git version >= 1.7.3 otherwise ''
	# var_have_git_1710	Set to 1 if git version >= 1.7.10 otherwise ''
	# var_have_git_185	Set to 1 if git version >= 1.8.5 otherwise ''
	# var_window_memory	Value to use for repack --window-memory=
	# var_big_file_threshold Value to use for core.bigFileThreshold
	# var_redelta_threshold	Recompute deltas if no more than this many objs
	# var_upload_window	If not "", pack.window to use for upload-pack
	# var_log_window_size	Value to use for git-svn --log-window-size=
	# var_utf8_locale	Value to use for a UTF-8 locale if available
	# var_xargs_r		A "-r" if xargs needs it to behave correctly
	# var_du_exclude	Option to exclude PATTERN from du if available
	# var_du_follow		Option to follow command line sym links if available
	#
	# All lines are written to standard output in var=value form suitable
	# for eval.  The body runs in a subshell so nothing leaks to the caller.
	_cfg_vars="$(get_girocco_config_pm_var_list)"
	eval "$_cfg_vars"
	printf '%s\n' "$_cfg_vars"
	printf 'var_group=%s\n' "${cfg_owning_group:-$(id -gn)}"
	_gver="$("$cfg_git_bin" version 2>/dev/null | \
		LC_ALL=C sed -ne 's/^[^0-9]*\([0-9][0-9]*\(\.[0-9][0-9]*\)*\).*$/\1/p')"
	printf 'var_git_ver=%s\n' "$_gver"
	printf 'var_git_exec_path="%s"\n' "$("$cfg_git_bin" --exec-path 2>/dev/null)"
	printf 'var_sh_bin="%s"\n' "$(_fcp "${cfg_posix_sh_bin:-/bin/sh}")"
	printf 'var_perl_bin="%s"\n' "$(_fcp "${cfg_perl_bin:-$(unset -f perl; command -v perl)}")"
	printf 'var_gzip_bin="%s"\n' "$(_fcp "${cfg_gzip_bin:-$(unset -f gzip; command -v gzip)}")"
	printf 'var_nc_openbsd_bin="%s"\n' "$(_fcp "${cfg_nc_openbsd_bin:-$(unset -f nc; command -v nc)}")"
	printf 'var_have_git_171=%s\n' "$([ $(vcmp "$_gver" 1.7.1) -ge 0 ] && echo 1)"
	printf 'var_have_git_172=%s\n' "$([ $(vcmp "$_gver" 1.7.2) -ge 0 ] && echo 1)"
	printf 'var_have_git_173=%s\n' "$([ $(vcmp "$_gver" 1.7.3) -ge 0 ] && echo 1)"
	printf 'var_have_git_1710=%s\n' "$([ $(vcmp "$_gver" 1.7.10) -ge 0 ] && echo 1)"
	printf 'var_have_git_185=%s\n' "$([ $(vcmp "$_gver" 1.8.5) -ge 0 ] && echo 1)"
	# Collect the common perl options as separate words (the positional
	# parameters are otherwise unused here) so that an include directory
	# containing whitespace survives intact.
	set -- "-I@basedir@"
	[ -z "$basedir" ] || set -- "$@" "-I$basedir"
	set -- "$@" "-M${GIROCCO_CONF:-Girocco::Config}" -MGirocco::Util
	printf "var_window_memory=%s\n" "$(perl "$@" -e 'print calc_windowmemory')"
	printf "var_big_file_threshold=%s\n" "$(perl "$@" -e 'print calc_bigfilethreshold')"
	printf "var_redelta_threshold=%s\n" "$(perl "$@" -e 'print calc_redeltathreshold')"
	# Only an upload-pack window in the range 2..50 is passed through
	if [ -n "$cfg_upload_pack_window" ] && [ "$cfg_upload_pack_window" -ge 2 ] && \
	   [ "$cfg_upload_pack_window" -le 50 ]; then
		printf "var_upload_window=%s\n" "$cfg_upload_pack_window"
	else
		printf "var_upload_window=%s\n" ""
	fi
	printf 'var_log_window_size=%s\n' "${cfg_svn_log_window_size:-250}"
	# We parse the output of `locale -a` and select a suitable UTF-8 locale.
	# POSIX/C variants are skipped and an en_US locale sorts first.
	_guess_locale="$(locale -a | LC_ALL=C grep -viE '^(posix|c)(\..*)?$' | \
		LC_ALL=C grep -iE '\.utf-?8$' | LC_ALL=C sed -e 's/\.[Uu][Tt][Ff]-*8$//' | \
		LC_ALL=C sed -e '/en_US/ s/^/0 /; /en_US/ !s/^/1 /' | LC_ALL=C sort | \
		head -n 1 | LC_ALL=C cut -d ' ' -f 2)"
	[ -z "$_guess_locale" ] || printf 'var_utf8_locale=%s.UTF-8\n' "$_guess_locale"
	# On some broken platforms running xargs without -r and empty input runs the command
	printf 'var_xargs_r=%s\n' "$(: | command xargs echo -r)"
	# The disk usage report produces better numbers if du has an exclude option
	# An option works if excluding this very script makes du print nothing.
	_x0="$(basename "$0")"
	_x0="${_x0%?}?*"
	for _duopt in --exclude -I; do
		if _test="$(du $_duopt 's?lib.s*' $_duopt "$_x0" "$0" 2>/dev/null)" && [ -z "$_test" ]; then
			printf 'var_du_exclude=%s\n' "$_duopt"
			break
		fi
	done
	# No loop is active here, so no "break" (it only produced a diagnostic)
	if _test="$(du -H "$0" 2>/dev/null)" && [ -n "$_test" ]; then
		printf 'var_du_follow=%s\n' "-H"
	fi
)
# If basedir has been replaced, and shlib_vars.sh exists, get the config
# definitions from it rather than running Perl.
# (The first test compares the placeholder against a split-up copy of itself;
# the split-up copy cannot be matched as a single token by a substitution.)
if [ "@basedir@" = '@'basedir'@' ] || ! [ -r "@basedir@/shlib_vars.sh" ]; then
	# Import all the variables from Girocco::Config to the local environment,
	eval "$(get_girocco_config_var_list)"
else
	# Import the variables from shlib_vars.sh which avoids needlessly
	# running another copy of Perl
	. "@basedir@/shlib_vars.sh"
fi
# git_add_config "some.var=value"
# every ' in value must be replaced with the 4-character sequence '\'' before
# calling this function or Git will barf.  Will not be effective unless running
# Git version 1.7.3 or later.
# The single-quoted setting is appended (space separated) to the exported
# GIT_CONFIG_PARAMETERS variable.
git_add_config() {
	GIT_CONFIG_PARAMETERS="${GIT_CONFIG_PARAMETERS:+$GIT_CONFIG_PARAMETERS }'$1'"
	export GIT_CONFIG_PARAMETERS
}
# Make sure we have a reproducible environment by using a controlled HOME dir
XDG_CONFIG_HOME="$cfg_chroot/var/empty"
HOME="$cfg_chroot/etc/girocco"
TMPDIR="/tmp"
GIT_CONFIG_NOSYSTEM=1
GIT_ATTR_NOSYSTEM=1
GIT_NO_REPLACE_OBJECTS=1
GIT_TERMINAL_PROMPT=0
GIT_ASKPASS="$cfg_basedir/bin/git-askpass-password"
export XDG_CONFIG_HOME
export HOME
export TMPDIR
export GIT_CONFIG_NOSYSTEM
export GIT_ATTR_NOSYSTEM
export GIT_NO_REPLACE_OBJECTS
export GIT_TERMINAL_PROMPT
export GIT_ASKPASS
# Any inherited user agent is dropped; the configured one (if defined) is
# then used for both user agent variables.
unset GIT_USER_AGENT
unset GIT_HTTP_USER_AGENT
if [ -n "$defined_cfg_git_client_ua" ]; then
	GIT_USER_AGENT="$cfg_git_client_ua"
	export GIT_USER_AGENT
	GIT_HTTP_USER_AGENT="$cfg_git_client_ua"
	export GIT_HTTP_USER_AGENT
fi
# Start from an empty set of command line config parameters
unset GIT_CONFIG_PARAMETERS
git_add_config "core.ignoreCase=false"
if [ -n "$cfg_git_no_mmap" ]; then
	# Just like compiling with NO_MMAP
	git_add_config "core.packedGitWindowSize=1m"
else
	# Always use the 32-bit default (32m) even on 64-bit to avoid memory blowout
	git_add_config "core.packedGitWindowSize=32m"
fi
[ -z "$var_big_file_threshold" ] ||
	git_add_config "core.bigFileThreshold=$var_big_file_threshold"

# Make sure any sendmail.pl config is always available
unset SENDMAIL_PL_HOST
unset SENDMAIL_PL_PORT
unset SENDMAIL_PL_NCBIN
unset SENDMAIL_PL_NCOPT
[ -z "$cfg_sendmail_pl_host" ] || { SENDMAIL_PL_HOST="$cfg_sendmail_pl_host" && export SENDMAIL_PL_HOST; }
[ -z "$cfg_sendmail_pl_port" ] || { SENDMAIL_PL_PORT="$cfg_sendmail_pl_port" && export SENDMAIL_PL_PORT; }
[ -z "$cfg_sendmail_pl_ncbin" ] || { SENDMAIL_PL_NCBIN="$cfg_sendmail_pl_ncbin" && export SENDMAIL_PL_NCBIN; }
[ -z "$cfg_sendmail_pl_ncopt" ] || { SENDMAIL_PL_NCOPT="$cfg_sendmail_pl_ncopt" && export SENDMAIL_PL_NCOPT; }

# Set PATH and PYTHON to the values set by Config.pm, if any
# (the previous PATH is remembered in orig_path when it is replaced)
unset PYTHON
[ -z "$cfg_python" ] || { PYTHON="$cfg_python" && export PYTHON; }
[ -z "$cfg_path" ] || { orig_path="$PATH" && PATH="$cfg_path" && export PATH; }
# Extra GIT variables that generally ought to be cleared, but whose clearing
# could potentially interfere with the correct operation of hook scripts so
# they are segregated into a separate function for use as appropriate
clean_git_env() {
	unset GIT_ALTERNATE_OBJECT_DIRECTORIES \
		GIT_CONFIG \
		GIT_DIR \
		GIT_GRAFT_FILE \
		GIT_INDEX_FILE \
		GIT_OBJECT_DIRECTORY \
		GIT_NAMESPACE
}
# We cannot use a git() {} or nc_openbsd() {} function to redirect git
# and nc_openbsd to the desired executables because when using
# "ENV_VAR=xxx func" the various /bin/sh implementations behave in various
# different and unexpected ways:
#   a) treat "ENV_VAR=xxx" like a separate, preceding "export ENV_VAR=xxx"
#   b) treat "ENV_VAR=xxx" like a separate, preceding "ENV_VAR=xxx"
#   c) treat "ENV_VAR=xxx" like a temporary setting only while running func
# None of these are good.  We want a temporary "export ENV_VAR=xxx"
# setting only while running func which none of the /bin/sh's do.
#
# Instead we'd like to use an alias that provides the desired behavior without
# any of the bad (a), (b) or (c) effects.
#
# However, unfortunately, some of the crazy /bin/sh implementations do not
# recognize alias expansions when preceded by variable assignments!
#
# So we are left with git() {} and nc_openbsd() {} functions and in the
# case of git() {} we can compensate for (b) and (c) failing to export
# but not (a) and (b) persisting the values so the caller will simply
# have to beware and explicitly unset any variables that should not persist
# beyond the function call itself.

# Runs "$cfg_git_bin" with the given arguments in a subshell after exporting
# each of the listed variables that is currently set (even if set to empty).
git() (
	[ -z "${GIT_DIR+set}" ] || export GIT_DIR
	[ -z "${GIT_SSL_NO_VERIFY+set}" ] || export GIT_SSL_NO_VERIFY
	[ -z "${GIT_TRACE_PACKET+set}" ] || export GIT_TRACE_PACKET
	[ -z "${GIT_USER_AGENT+set}" ] || export GIT_USER_AGENT
	[ -z "${GIT_HTTP_USER_AGENT+set}" ] || export GIT_HTTP_USER_AGENT
	exec "$cfg_git_bin" "$@"
)
# Since we do not yet require at least Git 1.8.5 this is a compatibility function
# that allows us to use git update-ref --stdin where supported and the slow shell
# script where not, but only the "delete" operation is currently supported.
# Input lines have the form "delete <ref>" optionally followed by an old value
# which, when present, is passed on to "git update-ref -d" as a separate
# argument instead of being folded into the ref name.
# Any other operation prints a diagnostic to stderr and exits with status 1.
git_updateref_stdin() {
	if [ -n "$var_have_git_185" ]; then
		git update-ref --stdin
	else
		while read -r _op _ref _old; do
			case "$_op" in
			delete)
				git update-ref -d "$_ref" ${_old:+"$_old"}
				;;
			*)
				echo "bad git_updateref_stdin op: $_op" >&2
				exit 1
				;;
			esac
		done
	fi
}
# see comments for git() -- callers must explicitly export all variables
# intended for the commands these functions run before calling them
# Each wrapper uses "command" so that the function itself is bypassed.
perl() { command "${var_perl_bin:-perl}" "$@"; }
gzip() { command "${var_gzip_bin:-gzip}" "$@"; }

nc_openbsd() { command "$var_nc_openbsd_bin" "$@"; }

list_packs() { command "$cfg_basedir/bin/list_packs" "$@"; }

strftime() { command "$cfg_basedir/bin/strftime" "$@"; }

# Some platforms' broken xargs runs the command always at least once even if
# there's no input unless given a special option.  Automatically supply the
# option on those platforms by providing an xargs function.
# ($var_xargs_r is deliberately unquoted so that an empty value adds no word)
xargs() { command xargs $var_xargs_r "$@"; }
# Joins all arguments with ", " and writes the result as a single line.
# With no arguments an empty line is written.
_addrlist() {
	_list=
	for _addr in "$@"; do
		# a separator is only added once the list is non-empty
		_list="${_list:+$_list, }$_addr"
	done
	# printf rather than echo so backslashes or a leading "-" in an
	# address are output unchanged
	printf '%s\n' "$_list"
}
# Runs the configured mailer (default /usr/sbin/sendmail) with -i and the
# given arguments, adding -f "$cfg_sender" when cfg_sender is non-empty.
_sendmail() {
	_mailer="${cfg_sendmail_bin:-/usr/sbin/sendmail}"
	if [ -z "$cfg_sender" ]; then
		"$_mailer" -i "$@"
	else
		"$_mailer" -i -f "$cfg_sender" "$@"
	fi
}
# mail [-s SUBJECT] ADDRESS...
# Writes a set of mail headers followed by a blank line and then everything
# read from standard input to _sendmail, passing the addresses as arguments.
mail() {
	_subject=
	if [ "$1" = "-s" ]; then
		shift
		_subject="$1"
		shift
	fi
	{
		printf '%s\n' "From: \"$cfg_name\" ($cfg_title) <$cfg_admin>"
		printf '%s\n' "To: $(_addrlist "$@")"
		[ -z "$_subject" ] || printf '%s\n' "Subject: $_subject"
		printf '%s\n' "MIME-Version: 1.0"
		printf '%s\n' "Content-Type: text/plain; charset=UTF-8"
		printf '%s\n' "Content-Transfer-Encoding: 8bit"
		# the X-Girocco header is omitted when cfg_suppress_x_girocco is set
		[ -n "$cfg_suppress_x_girocco" ] || printf '%s\n' "X-Girocco: $cfg_gitweburl"
		printf '%s\n' "Auto-Submitted: auto-generated"
		printf '%s\n' ""
		# the message body comes from standard input
		cat
	} | _sendmail "$@"
}
349 # bang CMD... will execute the command with well-defined failure mode;
350 # set bang_action to string of the failed action ('clone', 'update', ...);
351 # re-define the bang_trap() function to do custom cleanup before bailing out
#
# While the command runs bang_active is 1 and bang_cmd holds the command
# words joined into one string.  On success both are cleared and bang
# returns; on failure bang_errcode holds the command's exit status and
# bang_failed is called.
# NOTE(review): this listing has lost several short lines (loop/branch
# terminators and the here-document wrapper lines), so the block is not
# runnable exactly as shown here.
352 bang() {
353 bang_active=1
354 bang_cmd="$*"
355 bang_errcode=0
# With show_progress set the command's output (stderr merged into stdout) is
# shown via tee and also appended to $bang_log; a non-zero exit status is
# written to file descriptor 3 and read back into bang_errcode.
356 if [ -n "$show_progress" ]; then
357 exec 3>&1
358 read -r bang_errcode <<-EOT || :
360 exec 4>&3 3>&1 1>&4 4>&-
361 { "$@" 3>&- || echo $? >&3; } 2>&1 | tee -i -a "$bang_log"
364 exec 3>&-
365 if [ -z "$bang_errcode" ] || [ "$bang_errcode" = "0" ]; then
366 # All right. Cool.
367 bang_active=
368 bang_cmd=
369 return;
# Without show_progress all command output is only appended to $bang_log.
371 else
372 if "$@" >>"$bang_log" 2>&1; then
373 # All right. Cool.
374 bang_active=
375 bang_cmd=
376 return;
377 else
378 bang_errcode="$?"
# Only reached when the command failed.
381 bang_failed
# Records a failure of the command named in bang_cmd (status bang_errcode):
# marks the current directory with .banged, saves the log to .banglog,
# updates the girocco.bang.* config counters, possibly mails a notification,
# calls bang_trap and finally exits the shell with the failure status.
# NOTE(review): this listing has lost several short lines (branch terminators
# and group braces), so the block is not runnable exactly as shown here.
384 bang_failed() {
385 bang_active=
386 unset GIT_DIR
387 touch .banged
388 cat "$bang_log" > .banglog
389 echo "" >> .banglog
390 echo "$bang_cmd failed with error code $bang_errcode" >> .banglog
391 if [ -n "$show_progress" ]; then
392 echo ""
393 echo "$bang_cmd failed with error code $bang_errcode"
# A .bangagain marker discards the recorded girocco.bang state so that the
# failure count below starts over.
395 if [ -e .bangagain ]; then
396 git config --remove-section girocco.bang 2>/dev/null || :
397 rm -f .bangagain
# Increment the failure count (a missing count is taken as 0) and remember
# the time of the first failure.
399 bangcount="$(git config --int girocco.bang.count 2>/dev/null || :)"
400 : ${bangcount:=0}
401 bangcount=$(( $bangcount + 1 ))
402 git config --int girocco.bang.count $bangcount
403 if [ $bangcount -eq 1 ]; then
404 git config girocco.bang.firstfail "$(TZ=UTC date "+%Y-%m-%d %T UTC")"
# A notification is considered only when the failure count has reached
# cfg_min_mirror_failure_message_count, no message has been sent yet and
# check_interval reports that the configured interval since the first
# failure is over.
406 if [ $bangcount -ge $cfg_min_mirror_failure_message_count ] && \
407 [ "$(git config --bool girocco.bang.messagesent 2>/dev/null || :)" != "true" ] && \
408 ! check_interval "girocco.bang.firstfail" $cfg_min_mirror_failure_message_interval; then
409 bangmailok="$(git config --bool gitweb.statusupdates 2>/dev/null || echo true)"
410 bangaddrs=''
# Recipients: $mail unless gitweb.statusupdates is false, plus $cfg_admin
# when cfg_admincc is set to something other than "0".
# NOTE(review): $mail is not assigned anywhere in this block -- presumably it
# is set by the calling script; confirm.
411 [ "$bangmailok" = "false" -o -z "$mail" ] || bangaddrs="$mail"
412 [ -z "$cfg_admincc" -o "$cfg_admincc" = "0" -o -z "$cfg_admin" ] ||
413 if [ -z "$bangaddrs" ]; then bangaddrs="$cfg_admin"; else bangaddrs="$bangaddrs,$cfg_admin"; fi
414 rsubj=
415 [ $bangcount -le 1 ] || rsubj=" repeatedly"
416 [ -z "$bangaddrs" ] ||
418 echo "$bang_cmd failed with error code $bang_errcode"
419 echo ""
420 rsubj=
421 if [ $bangcount -gt 1 ]; then
422 echo "$bangcount consecutive update failures have occurred since $(config_get girocco.bang.firstfail)"
423 echo ""
425 echo "you will not receive any more notifications until recovery"
426 echo "this status message may be disabled on the project admin page"
427 echo ""
428 echo "Log follows:"
429 echo ""
430 cat "$bang_log"
431 } | mail -s "[$cfg_name] $proj $bang_action failed$rsubj" "$bangaddrs"
432 git config --bool girocco.bang.messagesent true
# bangthrottle becomes 1 once there have been at least 15 failures and
# check_interval for 1.5 times cfg_min_mirror_interval no longer succeeds;
# it is handed to bang_trap as its (possibly absent) argument.
434 bangthrottle=
435 [ $bangcount -lt 15 ] || \
436 check_interval "girocco.bang.firstfail" $(( $cfg_min_mirror_interval * 3 / 2 )) || \
437 bangthrottle=1
438 bang_trap $bangthrottle
# Always exit with a non-zero status (1 if none was recorded).
439 [ -n "$bang_errcode" ] && [ "$bang_errcode" != "0" ] || bang_errcode=1
440 exit $bang_errcode
# bang_eval CMD... will evaluate the command with well-defined failure mode;
# Identical to bang CMD... except the command is eval'd instead of executed.
# All arguments are joined into a single string that is handed to eval.
bang_eval() {
	bang eval "$*"
}
# Default bang settings:
# Resets the bang state, installs a no-op bang_trap, creates the temporary
# log file $bang_log and installs traps that remove the log on exit and
# report a failure (via bang_failed) if INT or TERM arrives while a bang
# command is active.  Must be called with the current directory set to a
# git directory otherwise a message is printed and the shell exits 1.
bang_setup() {
	bang_active=
	bang_action="lame_programmer"
	bang_trap() { :; }
	# Verify the directory before creating the log file so that no
	# temporary file is left behind when bailing out here (the EXIT
	# trap that removes it has not been installed at this point).
	is_git_dir . || {
		echo "bang_setup called with current directory not a git directory" >&2
		exit 1
	}
	bang_tmpdir="${TMPDIR:-/tmp}"
	bang_tmpdir="${bang_tmpdir%/}"
	bang_log="$(mktemp "${bang_tmpdir:-/tmp}/repomgr-XXXXXX")"
	trap 'rm -f "$bang_log"' EXIT
	trap '[ -z "$bang_active" ] || { bang_errcode=130; bang_failed; }; exit 130' INT
	trap '[ -z "$bang_active" ] || { bang_errcode=143; bang_failed; }; exit 143' TERM
}
# Remove banged status
# (deletes the marker files in the current directory and drops the
# girocco.bang config section, ignoring a missing section)
bang_reset() {
	rm -f .banged .bangagain .banglog
	git config --remove-section girocco.bang 2>/dev/null || :
}

# Check to see if banged status
# (true when a .banged marker exists in the current directory)
is_banged() {
	test -e .banged
}

# Check to see if banged message was sent
was_banged_message_sent() {
	_sent="$(git config --bool girocco.bang.messagesent 2>/dev/null || :)"
	[ "$_sent" = "true" ]
}
# Progress report - if show_progress is set, shows the given message.
# Always succeeds when show_progress is empty.
progress() {
	[ -z "$show_progress" ] || echo "$@"
}
# Project config accessors; must be run in project directory
# config_get NAME outputs the value of NAME if it contains a "." otherwise
# the value of gitweb.NAME; the exit status is that of git config.
config_get() {
	case "$1" in
	*.*)
		git config "$1"
		;;
	*)
		git config "gitweb.$1"
		;;
	esac
}
# config_set NAME VALUE sets gitweb.NAME to VALUE and then makes the file
# named "config" in the current directory group-owned by $var_group and
# group writable.  Later steps are skipped as soon as one fails.
config_set() {
	git config "gitweb.$1" "$2" && chgrp "$var_group" config && chmod g+w config
}

# config_set_raw NAME VALUE is like config_set except that NAME is used
# as-is without the "gitweb." prefix.
config_set_raw() {
	git config "$1" "$2" && chgrp "$var_group" config && chmod g+w config
}
# config_get_date_seconds NAME
# Reads config value NAME (via config_get), converts it with
# Girocco::Util::parse_any_date and outputs the result.
# Fails (status 1) if the value is empty or the conversion outputs nothing.
config_get_date_seconds() {
	_dt="$(config_get "$1" || :)"
	[ -n "$_dt" ] || return 1
	# Hand the date to perl as an argument rather than splicing it into
	# the program text so that quotes or backslashes in the stored value
	# can neither break nor alter the perl code being run.
	_ds="$(perl "-I@basedir@" -MGirocco::Util -e 'print parse_any_date($ARGV[0])' "$_dt")"
	[ -n "$_ds" ] || return 1
	printf '%s\n' "$_ds"
}
# Tool for checking whether given number of seconds has not passed yet
# check_interval NAME SECONDS succeeds while the current time is still less
# than the date stored in config value NAME plus SECONDS; it fails once that
# time has been reached or if the stored date cannot be obtained.
check_interval() {
	os="$(config_get_date_seconds "$1")" || return 1
	ns="$(date +%s)"
	[ "$ns" -lt "$(( os + $2 ))" ]
}
# Check if we are running with effective root permissions
# (true when `id -u` outputs 0)
is_root() {
	_uid="$(id -u 2>/dev/null)"
	[ "$_uid" = "0" ]
}
# Check to see if the single argument is a Git directory
# Requires searchable objects and refs subdirectories plus a HEAD that is
# a symbolic link into refs/, a file holding an object name (see $octet20)
# or a file holding a "ref:" line that names something below refs/.
is_git_dir() {
	# Just like Git's test except we ignore GIT_OBJECT_DIRECTORY
	# And we are slightly more picky (must be refs/.+ not refs/.*)
	[ -d "$1/objects" ] && [ -x "$1/objects" ] || return 1
	[ -d "$1/refs" ] && [ -x "$1/refs" ] || return 1
	if [ -L "$1/HEAD" ]; then
		_hr="$(readlink "$1/HEAD")"
		case "$_hr" in "refs/"?*) :;; *) return 1;; esac
	fi
	[ -f "$1/HEAD" ] && [ -r "$1/HEAD" ] || return 1
	# only the first line of HEAD is examined
	read -r _hr <"$1/HEAD" || return 1
	case "$_hr" in
		$octet20 | ref:refs/?*)
			return 0;;
		ref:*)
			# drop "ref:" plus everything up to the last space or tab
			_hr="${_hr##ref:*[ $tab]}"
			case "$_hr" in "refs/"?*) return 0;; esac
	esac
	return 1
}
# List all Git repositories, with given prefix if specified, one-per-line
# All project names starting with _ are always excluded from the result
# The names are taken from "$cfg_chroot"/etc/group: only entries whose
# numeric id is 65536 or higher are listed.  The optional argument is a
# grep pattern that gets anchored to the start of each "name:id" pair.
get_repo_list() {
	LC_ALL=C cut -d : -f 1,3 "$cfg_chroot"/etc/group |
	if [ -n "$1" ]; then
		LC_ALL=C grep "^$1"
	else
		cat
	fi |
	while IFS=: read -r _name _id; do
		# an entry without an id is treated as id 0 (never listed)
		[ "${_id:-0}" -lt 65536 ] || case "$_name" in _*) :;; ?*) echo "$_name"; esac
	done
}
# Return success if the given project name has any forks
# The name may be given with or without a trailing ".git".  A project has
# forks when "$cfg_reporoot/NAME" is a directory, "$cfg_reporoot/NAME.git"
# is a git directory and get_repo_list finds at least one "NAME/x" project.
has_forks() {
	_prj="${1%.git}"
	[ -n "$_prj" ] || return 1
	[ -d "$cfg_reporoot/$_prj" ] || return 1
	is_git_dir "$cfg_reporoot/$_prj.git" || return 1
	# any output at all means at least one fork was listed
	[ -n "$(get_repo_list "$_prj/[^/][^/]*:")" ]
}
# returns empty string and error for empty string otherwise one of
# m => normal Git mirror
# s => mirror from svn source
# d => mirror from darcs source
# b => mirror from bzr source
# h => mirror from hg source
# w => mirror from mediawiki source
# note that if the string is non-empty and none of s, d, b, h or w match the
# return will always be type m regardless of whether it's a valid Git URL
# NOTE(review): an "f" (other fast-import source) type is accepted by
# is_gfi_mirror_url but is never produced here.
get_url_mirror_type() {
	case "$1" in
		"")
			return 1
			;;
		svn://* | svn+http://* | svn+https://* | svn+file://* | svn+ssh://*)
			echo 's'
			;;
		darcs://*)
			echo 'd'
			;;
		bzr://*)
			echo 'b'
			;;
		hg+http://* | hg+https://* | hg+file://* | hg+ssh://* | hg::*)
			echo 'h'
			;;
		mediawiki::*)
			echo 'w'
			;;
		*)
			echo 'm'
			;;
	esac
	return 0
}
# returns false for empty string
# returns true if the passed in url is a mirror using git fast-import
is_gfi_mirror_url() {
	[ -n "$1" ] || return 1
	case "$(get_url_mirror_type "$1" 2>/dev/null || :)" in
		d|b|h|w|f)
			# darcs, bzr, hg and mediawiki mirrors use git fast-import
			# and so do generic "f" fast-import mirrors
			return 0
			;;
	esac
	# Don't think git-svn currently uses git fast-import
	# And Git mirrors certainly do not
	# so anything else is assumed not to use git fast-import
	return 1
}
# returns false for empty string
# returns true if the passed in url is a mirror using git-svn
# (i.e. get_url_mirror_type reports type "s" for it)
is_svn_mirror_url() {
	[ -n "$1" ] || return 1
	_mt="$(get_url_mirror_type "$1" 2>/dev/null || :)"
	[ "$_mt" = "s" ]
}
# returns mirror url for gitweb.baseurl of git directory
# (GIT_DIR) passed in as the argument (which defaults to "." if omitted)
# will fail if the directory does not have .nofetch and gitweb.baseurl
# comes back empty -- otherwise .nofetch directories succeed with a "" return
# automatically strips any leading "disabled " prefix before returning result
# (everything up to and including the last space in the value is removed)
get_mirror_url() {
	_gitdir="${1:-.}"
	# always return empty for non-mirrors
	if [ -e "$_gitdir/.nofetch" ]; then
		return 0
	fi
	_url="$(GIT_DIR="$_gitdir" config_get baseurl 2>/dev/null || :)"
	_url="${_url##* }"
	[ -n "$_url" ] || return 1
	printf '%s\n' "$_url"
	return 0
}
# returns get_url_mirror_type for gitweb.baseurl of git directory
# (GIT_DIR) passed in as the argument (which defaults to "." if omitted)
# will fail if get_mirror_url fails for the directory
# the url has any leading "disabled " prefix stripped before testing
# NOTE(review): for a .nofetch directory get_mirror_url yields "" and
# get_url_mirror_type "" fails, so this fails for such directories as well.
get_mirror_type() {
	_url="$(get_mirror_url "$@")" || return 1
	get_url_mirror_type "$_url"
}

# returns true if the passed in git dir (defaults to ".") is a mirror using git fast-import
is_gfi_mirror() {
	_url="$(get_mirror_url "$@")" || return 1
	is_gfi_mirror_url "$_url"
}

# returns true if the passed in git dir (defaults to ".") is a mirror using git-svn
is_svn_mirror() {
	_url="$(get_mirror_url "$@")" || return 1
	is_svn_mirror_url "$_url"
}
# current directory must already be set to Git repository
# if girocco.headok is already true succeeds without doing anything
# if rev-parse --verify HEAD succeeds sets headok=true and succeeds
# otherwise tries to set HEAD to a symbolic ref to refs/heads/master
# then refs/heads/trunk and finally the first top-level head from
# refs/heads/* (i.e. only two slashes in the name) and finally any
# existing refs/heads.  The first one to succeed wins and sets headok=true
# and then a successful exit.  Otherwise headok is left unset with a failure exit
# We use the girocco.headok flag to make sure we only force a valid HEAD symref
# when the repository is being set up -- if the HEAD is later deleted (through
# a push or fetch --prune) that's no longer our responsibility to fix
# Nothing is written to standard output by the existence checks.
check_and_set_head() {
	[ "$(git config --bool girocco.headok 2>/dev/null || :)" != "true" ] || return 0
	if git rev-parse --verify --quiet HEAD >/dev/null; then
		git config --bool girocco.headok true
		return 0
	fi
	for _hr in refs/heads/master refs/heads/trunk; do
		# discard the object name rev-parse prints on success
		if git rev-parse --verify --quiet "$_hr" >/dev/null; then
			_update_head_symref "$_hr"
			return 0
		fi
	done
	# The loop runs in the subshell created by the pipe: it exits that
	# subshell with status 1 after picking the first top-level head which
	# makes the "|| return 0" below fire.
	git for-each-ref --format="%(refname)" refs/heads 2>/dev/null |
	while read -r _hr; do
		case "${_hr#refs/heads/}" in */*) :;; *)
			_update_head_symref "$_hr"
			exit 1 # exit subshell created by "|"
		esac
	done || return 0
	# no top-level head exists so settle for the first head of any depth
	_hr="$(git for-each-ref --format="%(refname)" refs/heads 2>/dev/null | head -n 1 || :)"
	if [ -n "$_hr" ]; then
		_update_head_symref "$_hr"
		return 0
	fi
	return 1
}
# Points HEAD at the ref given as "$1", records girocco.headok=true and, if
# an htmlcache directory exists in the current directory, creates (or
# truncates) htmlcache/changed ignoring any failure to do so.
_update_head_symref() {
	git symbolic-ref HEAD "$1"
	git config --bool girocco.headok true
	! [ -d htmlcache ] || { >htmlcache/changed; } 2>/dev/null || :
}
# A well-known UTF-8 locale is required for some of the fast-import providers
# in order to avoid mangling characters.  Ideally we could use "POSIX.UTF-8"
# but that is not reliably UTF-8 but rather usually US-ASCII.
# We parse the output of `locale -a` and select a suitable UTF-8 locale at
# install time and store that in $var_utf8_locale if one is found.
# If we cannot find one in the `locale -a` output then we just use a well-known
# UTF-8 locale and hope for the best.  We set LC_ALL to our choice and export
# it.  We only set this temporarily when running the fast-import providers.
set_utf8_locale() {
	# fall back to en_US.UTF-8 when no locale was found at install time
	LC_ALL="${var_utf8_locale:-en_US.UTF-8}"
	export LC_ALL
}
726 # hg-fast-export | git fast-import with error handling in current directory GIT_DIR
727 git_hg_fetch() (
728 set_utf8_locale
729 _python="${PYTHON:-python}"
730 rm -f hg2git-marks.old hg2git-marks.new
731 if [ -f hg2git-marks -a -s hg2git-marks ]; then
732 LC_ALL=C sed 's/^:\([^ ][^ ]*\) \([^ ][^ ]*\)$/\2 \1/' <hg2git-marks | {
733 if [ -n "$var_have_git_185" ]; then
734 git cat-file --batch-check=':%(rest) %(objectname)'
735 else
736 LC_ALL=C sed 's/^\([^ ][^ ]*\) \([^ ][^ ]*\)$/:\2 \1/'
738 } | LC_ALL=C sed '/ missing$/d' >hg2git-marks.old
739 if [ -n "$var_have_git_171" ] && \
740 git rev-parse --quiet --verify refs/notes/hg >/dev/null; then
741 if [ -z "$var_have_git_185" ] || \
742 ! LC_ALL=C cmp -s hg2git-marks hg2git-marks.old; then
743 _nm='hg-fast-export'
744 GIT_AUTHOR_NAME="$_nm"
745 GIT_COMMITTER_NAME="$_nm"
746 GIT_AUTHOR_EMAIL="$_nm"
747 GIT_COMMITTER_EMAIL="$_nm"
748 export GIT_AUTHOR_NAME
749 export GIT_COMMITTER_NAME
750 export GIT_AUTHOR_EMAIL
751 export GIT_COMMITTER_EMAIL
752 git notes --ref=refs/notes/hg prune
753 unset GIT_AUTHOR_NAME
754 unset GIT_COMMITTER_NAME
755 unset GIT_AUTHOR_EMAIL
756 unset GIT_COMMITTER_EMAIL
759 else
760 >hg2git-marks.old
762 _err1=
763 _err2=
764 exec 3>&1
765 { read -r _err1 || :; read -r _err2 || :; } <<-EOT
767 exec 4>&3 3>&1 1>&4 4>&-
769 _e1=0
770 _af="$(git config hg.authorsfile || :)"
771 _cmd='GIT_DIR="$(pwd)" "$_python" "$cfg_basedir/bin/hg-fast-export.py" \
772 --repo "$(pwd)/repo.hg" \
773 --marks "$(pwd)/hg2git-marks.old" \
774 --mapping "$(pwd)/hg2git-mapping" \
775 --heads "$(pwd)/hg2git-heads" \
776 --status "$(pwd)/hg2git-state" \
777 -U unknown --force --flatten --hg-hash'
778 [ -z "$_af" ] || _cmd="$_cmd"' --authors "$_af"'
779 eval "$_cmd" 3>&- || _e1=$?
780 echo $_e1 >&3
781 } | \
783 _e2=0
784 git fast-import \
785 --import-marks="$(pwd)/hg2git-marks.old" \
786 --export-marks="$(pwd)/hg2git-marks.new" \
787 --export-pack-edges="$(pwd)/gfi-packs" \
788 --force 3>&- || _e2=$?
789 echo $_e2 >&3
793 exec 3>&-
794 [ "$_err1" = 0 -a "$_err2" = 0 ] || return 1
795 mv -f hg2git-marks.new hg2git-marks
796 rm -f hg2git-marks.old
797 git for-each-ref --format='%(refname) %(objectname)' refs/heads | \
798 LC_ALL=C sed -e 's,^refs/heads/,:,' >hg2git-heads