src/common/util.c

   1 /* Copyright (c) 2003, Roger Dingledine
   2  * Copyright (c) 2004-2006, Roger Dingledine, Nick Mathewson.
   3  * Copyright (c) 2007-2015, The Tor Project, Inc. */
   4 /* See LICENSE for licensing information */
   5
   6 /**
   7  * \file util.c
   8  * \brief Common functions for strings, IO, network, data structures,
   9  * process control.
  10  **/
  11
  12 /* This is required on rh7 to make strptime not complain.
  13  */
  14 #define _GNU_SOURCE
  15
  16 #include "orconfig.h"
  17 #ifdef HAVE_FCNTL_H
  18 #include <fcntl.h>
  19 #endif
  20 #define UTIL_PRIVATE
  21 #include "util.h"
  22 #include "torlog.h"
  23 #include "crypto.h"
  24 #include "torint.h"
  25 #include "container.h"
  26 #include "address.h"
  27 #include "sandbox.h"
  28 #include "backtrace.h"
  29 #include "util_process.h"
  30 #include "util_format.h"
  31
  32 #ifdef _WIN32
  33 #include <io.h>
  34 #include <direct.h>
  35 #include <process.h>
  36 #include <tchar.h>
  37 #include <winbase.h>
  38 #else
  39 #include <dirent.h>
  40 #include <pwd.h>
  41 #include <grp.h>
  42 #endif
  43
  44 /* math.h needs this on Linux */
  45 #ifndef _USE_ISOC99_
  46 #define _USE_ISOC99_ 1
  47 #endif
  48 #include <math.h>
  49 #include <stdlib.h>
  50 #include <stdio.h>
  51 #include <string.h>
  52 #include <assert.h>
  53 #include <signal.h>
  54
  55 #ifdef HAVE_NETINET_IN_H
  56 #include <netinet/in.h>
  57 #endif
  58 #ifdef HAVE_ARPA_INET_H
  59 #include <arpa/inet.h>
  60 #endif
  61 #ifdef HAVE_ERRNO_H
  62 #include <errno.h>
  63 #endif
  64 #ifdef HAVE_SYS_SOCKET_H
  65 #include <sys/socket.h>
  66 #endif
  67 #ifdef HAVE_SYS_TIME_H
  68 #include <sys/time.h>
  69 #endif
  70 #ifdef HAVE_UNISTD_H
  71 #include <unistd.h>
  72 #endif
  73 #ifdef HAVE_SYS_STAT_H
  74 #include <sys/stat.h>
  75 #endif
  76 #ifdef HAVE_SYS_FCNTL_H
  77 #include <sys/fcntl.h>
  78 #endif
  79 #ifdef HAVE_TIME_H
  80 #include <time.h>
  81 #endif
  82 #ifdef HAVE_MALLOC_MALLOC_H
  83 #include <malloc/malloc.h>
  84 #endif
  85 #ifdef HAVE_MALLOC_H
  86 #if !defined(OPENBSD) && !defined(__FreeBSD__)
  87 /* OpenBSD has a malloc.h, but for our purposes, it only exists in order to
  88  * scold us for being so stupid as to autodetect its presence.  To be fair,
  89  * they've done this since 1996, when autoconf was only 5 years old. */
  90 #include <malloc.h>
  91 #endif
  92 #endif
  93 #ifdef HAVE_MALLOC_NP_H
  94 #include <malloc_np.h>
  95 #endif
  96 #ifdef HAVE_SYS_WAIT_H
  97 #include <sys/wait.h>
  98 #endif
  99 #if defined(HAVE_SYS_PRCTL_H) && defined(__linux__)
 100 #include <sys/prctl.h>
 101 #endif
 102
 103 #ifdef __clang_analyzer__
 104 #undef MALLOC_ZERO_WORKS
 105 #endif
 106
 107 /* =====
 108  * Assertion helper.
 109  * ===== */
 110 /** Helper for tor_assert: report the assertion failure. */
 111 void
 112 tor_assertion_failed_(const char *fname, unsigned int line,
 113                       const char *func, const char *expr)
 114 {
 115   char buf[256];
 116   log_err(LD_BUG, "%s:%u: %s: Assertion %s failed; aborting.",
 117           fname, line, func, expr);
 118   tor_snprintf(buf, sizeof(buf),
 119                "Assertion %s failed in %s at %s:%u",
 120                expr, func, fname, line);
 121   log_backtrace(LOG_ERR, LD_BUG, buf);
 122 }
 123
 124 /* =====
 125  * Memory management
 126  * ===== */
 127 #ifdef USE_DMALLOC
 128  #undef strndup
 129  #include <dmalloc.h>
 130  /* Macro to pass the extra dmalloc args to another function. */
 131  #define DMALLOC_FN_ARGS , file, line
 132
 133  #if defined(HAVE_DMALLOC_STRDUP)
 134  /* the dmalloc_strdup should be fine as defined */
 135  #elif defined(HAVE_DMALLOC_STRNDUP)
 136  #define dmalloc_strdup(file, line, string, xalloc_b) \
 137          dmalloc_strndup(file, line, (string), -1, xalloc_b)
 138  #else
 139  #error "No dmalloc_strdup or equivalent"
 140  #endif
 141
 142 #else /* not using dmalloc */
 143
 144  #define DMALLOC_FN_ARGS
 145 #endif
 146
 147 /** Allocate a chunk of <b>size</b> bytes of memory, and return a pointer to
 148  * result.  On error, log and terminate the process.  (Same as malloc(size),
 149  * but never returns NULL.)
 150  *
 151  * <b>file</b> and <b>line</b> are used if dmalloc is enabled, and
 152  * ignored otherwise.
 153  */
 154 void *
 155 tor_malloc_(size_t size DMALLOC_PARAMS)
 156 {
 157   void *result;
 158
 159   tor_assert(size < SIZE_T_CEILING);
 160
 161 #ifndef MALLOC_ZERO_WORKS
 162   /* Some libc mallocs don't work when size==0. Override them. */
 163   if (size==0) {
 164     size=1;
 165   }
 166 #endif
 167
 168 #ifdef USE_DMALLOC
 169   result = dmalloc_malloc(file, line, size, DMALLOC_FUNC_MALLOC, 0, 0);
 170 #else
 171   result = malloc(size);
 172 #endif
 173
 174   if (PREDICT_UNLIKELY(result == NULL)) {
 175     log_err(LD_MM,"Out of memory on malloc(). Dying.");
 176     /* If these functions die within a worker process, they won't call
 177      * spawn_exit, but that's ok, since the parent will run out of memory soon
 178      * anyway. */
 179     exit(1);
 180   }
 181   return result;
 182 }
 183
 184 /** Allocate a chunk of <b>size</b> bytes of memory, fill the memory with
 185  * zero bytes, and return a pointer to the result.  Log and terminate
 186  * the process on error.  (Same as calloc(size,1), but never returns NULL.)
 187  */
 188 void *
 189 tor_malloc_zero_(size_t size DMALLOC_PARAMS)
 190 {
 191   /* You may ask yourself, "wouldn't it be smart to use calloc instead of
 192    * malloc+memset?  Perhaps libc's calloc knows some nifty optimization trick
 193    * we don't!"  Indeed it does, but its optimizations are only a big win when
 194    * we're allocating something very big (it knows if it just got the memory
 195    * from the OS in a pre-zeroed state).  We don't want to use tor_malloc_zero
 196    * for big stuff, so we don't bother with calloc. */
 197   void *result = tor_malloc_(size DMALLOC_FN_ARGS);
 198   memset(result, 0, size);
 199   return result;
 200 }
 201
 202 /* The square root of SIZE_MAX + 1.  If a is less than this, and b is less
 203  * than this, then a*b is less than SIZE_MAX.  (For example, if size_t is
 204  * 32 bits, then SIZE_MAX is 0xffffffff and this value is 0x10000.  If a and
 205  * b are less than this, then their product is at most (65535*65535) ==
 206  * 0xfffe0001. */
 207 #define SQRT_SIZE_MAX_P1 (((size_t)1) << (sizeof(size_t)*4))
 208
 209 /** Return non-zero if and only if the product of the arguments is exact. */
 210 static inline int
 211 size_mul_check(const size_t x, const size_t y)
 212 {
 213   /* This first check is equivalent to
 214      (x < SQRT_SIZE_MAX_P1 && y < SQRT_SIZE_MAX_P1)
 215
 216      Rationale: if either one of x or y is >= SQRT_SIZE_MAX_P1, then it
 217      will have some bit set in its most significant half.
 218    */
 219   return ((x|y) < SQRT_SIZE_MAX_P1 ||
 220           y == 0 ||
 221           x <= SIZE_MAX / y);
 222 }
 223
 224 /** Allocate a chunk of <b>nmemb</b>*<b>size</b> bytes of memory, fill
 225  * the memory with zero bytes, and return a pointer to the result.
 226  * Log and terminate the process on error.  (Same as
 227  * calloc(<b>nmemb</b>,<b>size</b>), but never returns NULL.)
 228  * The second argument (<b>size</b>) should preferably be non-zero
 229  * and a compile-time constant.
 230  */
 231 void *
 232 tor_calloc_(size_t nmemb, size_t size DMALLOC_PARAMS)
 233 {
 234   tor_assert(size_mul_check(nmemb, size));
 235   return tor_malloc_zero_((nmemb * size) DMALLOC_FN_ARGS);
 236 }
 237
 238 /** Change the size of the memory block pointed to by <b>ptr</b> to <b>size</b>
 239  * bytes long; return the new memory block.  On error, log and
 240  * terminate. (Like realloc(ptr,size), but never returns NULL.)
 241  */
 242 void *
 243 tor_realloc_(void *ptr, size_t size DMALLOC_PARAMS)
 244 {
 245   void *result;
 246
 247   tor_assert(size < SIZE_T_CEILING);
 248
 249 #ifndef MALLOC_ZERO_WORKS
 250   /* Some libc mallocs don't work when size==0. Override them. */
 251   if (size==0) {
 252     size=1;
 253   }
 254 #endif
 255
 256 #ifdef USE_DMALLOC
 257   result = dmalloc_realloc(file, line, ptr, size, DMALLOC_FUNC_REALLOC, 0);
 258 #else
 259   result = realloc(ptr, size);
 260 #endif
 261
 262   if (PREDICT_UNLIKELY(result == NULL)) {
 263     log_err(LD_MM,"Out of memory on realloc(). Dying.");
 264     exit(1);
 265   }
 266   return result;
 267 }
 268
 269 /**
 270  * Try to realloc <b>ptr</b> so that it takes up sz1 * sz2 bytes.  Check for
 271  * overflow. Unlike other allocation functions, return NULL on overflow.
 272  */
 273 void *
 274 tor_reallocarray_(void *ptr, size_t sz1, size_t sz2 DMALLOC_PARAMS)
 275 {
 276   /* XXXX we can make this return 0, but we would need to check all the
 277    * reallocarray users. */
 278   tor_assert(size_mul_check(sz1, sz2));
 279
 280   return tor_realloc(ptr, (sz1 * sz2) DMALLOC_FN_ARGS);
 281 }
 282
 283 /** Return a newly allocated copy of the NUL-terminated string s. On
 284  * error, log and terminate.  (Like strdup(s), but never returns
 285  * NULL.)
 286  */
 287 char *
 288 tor_strdup_(const char *s DMALLOC_PARAMS)
 289 {
 290   char *dup;
 291   tor_assert(s);
 292
 293 #ifdef USE_DMALLOC
 294   dup = dmalloc_strdup(file, line, s, 0);
 295 #else
 296   dup = strdup(s);
 297 #endif
 298   if (PREDICT_UNLIKELY(dup == NULL)) {
 299     log_err(LD_MM,"Out of memory on strdup(). Dying.");
 300     exit(1);
 301   }
 302   return dup;
 303 }
 304
 305 /** Allocate and return a new string containing the first <b>n</b>
 306  * characters of <b>s</b>.  If <b>s</b> is longer than <b>n</b>
 307  * characters, only the first <b>n</b> are copied.  The result is
 308  * always NUL-terminated.  (Like strndup(s,n), but never returns
 309  * NULL.)
 310  */
 311 char *
 312 tor_strndup_(const char *s, size_t n DMALLOC_PARAMS)
 313 {
 314   char *dup;
 315   tor_assert(s);
 316   tor_assert(n < SIZE_T_CEILING);
 317   dup = tor_malloc_((n+1) DMALLOC_FN_ARGS);
 318   /* Performance note: Ordinarily we prefer strlcpy to strncpy.  But
 319    * this function gets called a whole lot, and platform strncpy is
 320    * much faster than strlcpy when strlen(s) is much longer than n.
 321    */
 322   strncpy(dup, s, n);
 323   dup[n]='\0';
 324   return dup;
 325 }
 326
 327 /** Allocate a chunk of <b>len</b> bytes, with the same contents as the
 328  * <b>len</b> bytes starting at <b>mem</b>. */
 329 void *
 330 tor_memdup_(const void *mem, size_t len DMALLOC_PARAMS)
 331 {
 332   char *dup;
 333   tor_assert(len < SIZE_T_CEILING);
 334   tor_assert(mem);
 335   dup = tor_malloc_(len DMALLOC_FN_ARGS);
 336   memcpy(dup, mem, len);
 337   return dup;
 338 }
 339
 340 /** As tor_memdup(), but add an extra 0 byte at the end of the resulting
 341  * memory. */
 342 void *
 343 tor_memdup_nulterm_(const void *mem, size_t len DMALLOC_PARAMS)
 344 {
 345   char *dup;
 346   tor_assert(len < SIZE_T_CEILING+1);
 347   tor_assert(mem);
 348   dup = tor_malloc_(len+1 DMALLOC_FN_ARGS);
 349   memcpy(dup, mem, len);
 350   dup[len] = '\0';
 351   return dup;
 352 }
 353
 354 /** Helper for places that need to take a function pointer to the right
 355  * spelling of "free()". */
 356 void
 357 tor_free_(void *mem)
 358 {
 359   tor_free(mem);
 360 }
 361
 362 /** Call the platform malloc info function, and dump the results to the log at
 363  * level <b>severity</b>.  If no such function exists, do nothing. */
 364 void
 365 tor_log_mallinfo(int severity)
 366 {
 367 #ifdef HAVE_MALLINFO
 368   struct mallinfo mi;
 369   memset(&mi, 0, sizeof(mi));
 370   mi = mallinfo();
 371   tor_log(severity, LD_MM,
 372       "mallinfo() said: arena=%d, ordblks=%d, smblks=%d, hblks=%d, "
 373       "hblkhd=%d, usmblks=%d, fsmblks=%d, uordblks=%d, fordblks=%d, "
 374       "keepcost=%d",
 375       mi.arena, mi.ordblks, mi.smblks, mi.hblks,
 376       mi.hblkhd, mi.usmblks, mi.fsmblks, mi.uordblks, mi.fordblks,
 377       mi.keepcost);
 378 #else
 379   (void)severity;
 380 #endif
 381 #ifdef USE_DMALLOC
 382   dmalloc_log_changed(0, /* Since the program started. */
 383                       1, /* Log info about non-freed pointers. */
 384                       0, /* Do not log info about freed pointers. */
 385                       0  /* Do not log individual pointers. */
 386                       );
 387 #endif
 388 }
 389
 390 /* =====
 391  * Math
 392  * ===== */
 393
 394 /**
 395  * Returns the natural logarithm of d base e.  We defined this wrapper here so
 396  * to avoid conflicts with old versions of tor_log(), which were named log().
 397  */
 398 double
 399 tor_mathlog(double d)
 400 {
 401   return log(d);
 402 }
 403
 404 /** Return the long integer closest to <b>d</b>. We define this wrapper
 405  * here so that not all users of math.h need to use the right incantations
 406  * to get the c99 functions. */
 407 long
 408 tor_lround(double d)
 409 {
 410 #if defined(HAVE_LROUND)
 411   return lround(d);
 412 #elif defined(HAVE_RINT)
 413   return (long)rint(d);
 414 #else
 415   return (long)(d > 0 ? d + 0.5 : ceil(d - 0.5));
 416 #endif
 417 }
 418
 419 /** Return the 64-bit integer closest to d.  We define this wrapper here so
 420  * that not all users of math.h need to use the right incantations to get the
 421  * c99 functions. */
 422 int64_t
 423 tor_llround(double d)
 424 {
 425 #if defined(HAVE_LLROUND)
 426   return (int64_t)llround(d);
 427 #elif defined(HAVE_RINT)
 428   return (int64_t)rint(d);
 429 #else
 430   return (int64_t)(d > 0 ? d + 0.5 : ceil(d - 0.5));
 431 #endif
 432 }
 433
 434 /** Returns floor(log2(u64)).  If u64 is 0, (incorrectly) returns 0. */
 435 int
 436 tor_log2(uint64_t u64)
 437 {
 438   int r = 0;
 439   if (u64 >= (U64_LITERAL(1)<<32)) {
 440     u64 >>= 32;
 441     r = 32;
 442   }
 443   if (u64 >= (U64_LITERAL(1)<<16)) {
 444     u64 >>= 16;
 445     r += 16;
 446   }
 447   if (u64 >= (U64_LITERAL(1)<<8)) {
 448     u64 >>= 8;
 449     r += 8;
 450   }
 451   if (u64 >= (U64_LITERAL(1)<<4)) {
 452     u64 >>= 4;
 453     r += 4;
 454   }
 455   if (u64 >= (U64_LITERAL(1)<<2)) {
 456     u64 >>= 2;
 457     r += 2;
 458   }
 459   if (u64 >= (U64_LITERAL(1)<<1)) {
 460     u64 >>= 1;
 461     r += 1;
 462   }
 463   return r;
 464 }
 465
 466 /** Return the power of 2 in range [1,UINT64_MAX] closest to <b>u64</b>.  If
 467  * there are two powers of 2 equally close, round down. */
 468 uint64_t
 469 round_to_power_of_2(uint64_t u64)
 470 {
 471   int lg2;
 472   uint64_t low;
 473   uint64_t high;
 474   if (u64 == 0)
 475     return 1;
 476
 477   lg2 = tor_log2(u64);
 478   low = U64_LITERAL(1) << lg2;
 479
 480   if (lg2 == 63)
 481     return low;
 482
 483   high = U64_LITERAL(1) << (lg2+1);
 484   if (high - u64 < u64 - low)
 485     return high;
 486   else
 487     return low;
 488 }
 489
 490 /** Return the lowest x such that x is at least <b>number</b>, and x modulo
 491  * <b>divisor</b> == 0.  If no such x can be expressed as an unsigned, return
 492  * UINT_MAX */
 493 unsigned
 494 round_to_next_multiple_of(unsigned number, unsigned divisor)
 495 {
 496   tor_assert(divisor > 0);
 497   if (UINT_MAX - divisor + 1 < number)
 498     return UINT_MAX;
 499   number += divisor - 1;
 500   number -= number % divisor;
 501   return number;
 502 }
 503
 504 /** Return the lowest x such that x is at least <b>number</b>, and x modulo
 505  * <b>divisor</b> == 0. If no such x can be expressed as a uint32_t, return
 506  * UINT32_MAX */
 507 uint32_t
 508 round_uint32_to_next_multiple_of(uint32_t number, uint32_t divisor)
 509 {
 510   tor_assert(divisor > 0);
 511   if (UINT32_MAX - divisor + 1 < number)
 512     return UINT32_MAX;
 513
 514   number += divisor - 1;
 515   number -= number % divisor;
 516   return number;
 517 }
 518
 519 /** Return the lowest x such that x is at least <b>number</b>, and x modulo
 520  * <b>divisor</b> == 0. If no such x can be expressed as a uint64_t, return
 521  * UINT64_MAX */
 522 uint64_t
 523 round_uint64_to_next_multiple_of(uint64_t number, uint64_t divisor)
 524 {
 525   tor_assert(divisor > 0);
 526   if (UINT64_MAX - divisor + 1 < number)
 527     return UINT64_MAX;
 528   number += divisor - 1;
 529   number -= number % divisor;
 530   return number;
 531 }
 532
 533 /** Return the lowest x in [INT64_MIN, INT64_MAX] such that x is at least
 534  * <b>number</b>, and x modulo <b>divisor</b> == 0. If no such x can be
 535  * expressed as an int64_t, return INT64_MAX */
 536 int64_t
 537 round_int64_to_next_multiple_of(int64_t number, int64_t divisor)
 538 {
 539   tor_assert(divisor > 0);
 540   if (INT64_MAX - divisor + 1 < number)
 541     return INT64_MAX;
 542   if (number >= 0)
 543     number += divisor - 1;
 544   number -= number % divisor;
 545   return number;
 546 }
 547
 548 /** Transform a random value <b>p</b> from the uniform distribution in
 549  * [0.0, 1.0[ into a Laplace distributed value with location parameter
 550  * <b>mu</b> and scale parameter <b>b</b>. Truncate the final result
 551  * to be an integer in [INT64_MIN, INT64_MAX]. */
 552 int64_t
 553 sample_laplace_distribution(double mu, double b, double p)
 554 {
 555   double result;
 556   tor_assert(p >= 0.0 && p < 1.0);
 557
 558   /* This is the "inverse cumulative distribution function" from:
 559    * http://en.wikipedia.org/wiki/Laplace_distribution */
 560   if (p <= 0.0) {
 561     /* Avoid taking log(0.0) == -INFINITY, as some processors or compiler
 562      * options can cause the program to trap. */
 563     return INT64_MIN;
 564   }
 565
 566   result = mu - b * (p > 0.5 ? 1.0 : -1.0)
 567                   * tor_mathlog(1.0 - 2.0 * fabs(p - 0.5));
 568
 569   return clamp_double_to_int64(result);
 570 }
 571
 572 /** Add random noise between INT64_MIN and INT64_MAX coming from a Laplace
 573  * distribution with mu = 0 and b = <b>delta_f</b>/<b>epsilon</b> to
 574  * <b>signal</b> based on the provided <b>random</b> value in [0.0, 1.0[.
 575  * The epsilon value must be between ]0.0, 1.0]. delta_f must be greater
 576  * than 0. */
 577 int64_t
 578 add_laplace_noise(int64_t signal, double random, double delta_f,
 579                   double epsilon)
 580 {
 581   int64_t noise;
 582
 583   /* epsilon MUST be between ]0.0, 1.0] */
 584   tor_assert(epsilon > 0.0 && epsilon <= 1.0);
 585   /* delta_f MUST be greater than 0. */
 586   tor_assert(delta_f > 0.0);
 587
 588   /* Just add noise, no further signal */
 589   noise = sample_laplace_distribution(0.0,
 590                                       delta_f / epsilon,
 591                                       random);
 592
 593   /* Clip (signal + noise) to [INT64_MIN, INT64_MAX] */
 594   if (noise > 0 && INT64_MAX - noise < signal)
 595     return INT64_MAX;
 596   else if (noise < 0 && INT64_MIN - noise > signal)
 597     return INT64_MIN;
 598   else
 599     return signal + noise;
 600 }
 601
 602 /** Return the number of bits set in <b>v</b>. */
 603 int
 604 n_bits_set_u8(uint8_t v)
 605 {
 606   static const int nybble_table[] = {
 607     0, /* 0000 */
 608     1, /* 0001 */
 609     1, /* 0010 */
 610     2, /* 0011 */
 611     1, /* 0100 */
 612     2, /* 0101 */
 613     2, /* 0110 */
 614     3, /* 0111 */
 615     1, /* 1000 */
 616     2, /* 1001 */
 617     2, /* 1010 */
 618     3, /* 1011 */
 619     2, /* 1100 */
 620     3, /* 1101 */
 621     3, /* 1110 */
 622     4, /* 1111 */
 623   };
 624
 625   return nybble_table[v & 15] + nybble_table[v>>4];
 626 }
 627
 628 /* =====
 629  * String manipulation
 630  * ===== */
 631
 632 /** Remove from the string <b>s</b> every character which appears in
 633  * <b>strip</b>. */
 634 void
 635 tor_strstrip(char *s, const char *strip)
 636 {
 637   char *read = s;
 638   while (*read) {
 639     if (strchr(strip, *read)) {
 640       ++read;
 641     } else {
 642       *s++ = *read++;
 643     }
 644   }
 645   *s = '\0';
 646 }
 647
 648 /** Return a pointer to a NUL-terminated hexadecimal string encoding
 649  * the first <b>fromlen</b> bytes of <b>from</b>. (fromlen must be \<= 32.) The
 650  * result does not need to be deallocated, but repeated calls to
 651  * hex_str will trash old results.
 652  */
 653 const char *
 654 hex_str(const char *from, size_t fromlen)
 655 {
 656   static char buf[65];
 657   if (fromlen>(sizeof(buf)-1)/2)
 658     fromlen = (sizeof(buf)-1)/2;
 659   base16_encode(buf,sizeof(buf),from,fromlen);
 660   return buf;
 661 }
 662
 663 /** Convert all alphabetic characters in the nul-terminated string <b>s</b> to
 664  * lowercase. */
 665 void
 666 tor_strlower(char *s)
 667 {
 668   while (*s) {
 669     *s = TOR_TOLOWER(*s);
 670     ++s;
 671   }
 672 }
 673
 674 /** Convert all alphabetic characters in the nul-terminated string <b>s</b> to
 675  * lowercase. */
 676 void
 677 tor_strupper(char *s)
 678 {
 679   while (*s) {
 680     *s = TOR_TOUPPER(*s);
 681     ++s;
 682   }
 683 }
 684
 685 /** Return 1 if every character in <b>s</b> is printable, else return 0.
 686  */
 687 int
 688 tor_strisprint(const char *s)
 689 {
 690   while (*s) {
 691     if (!TOR_ISPRINT(*s))
 692       return 0;
 693     s++;
 694   }
 695   return 1;
 696 }
 697
 698 /** Return 1 if no character in <b>s</b> is uppercase, else return 0.
 699  */
 700 int
 701 tor_strisnonupper(const char *s)
 702 {
 703   while (*s) {
 704     if (TOR_ISUPPER(*s))
 705       return 0;
 706     s++;
 707   }
 708   return 1;
 709 }
 710
 711 /** As strcmp, except that either string may be NULL.  The NULL string is
 712  * considered to be before any non-NULL string. */
 713 int
 714 strcmp_opt(const char *s1, const char *s2)
 715 {
 716   if (!s1) {
 717     if (!s2)
 718       return 0;
 719     else
 720       return -1;
 721   } else if (!s2) {
 722     return 1;
 723   } else {
 724     return strcmp(s1, s2);
 725   }
 726 }
 727
 728 /** Compares the first strlen(s2) characters of s1 with s2.  Returns as for
 729  * strcmp.
 730  */
 731 int
 732 strcmpstart(const char *s1, const char *s2)
 733 {
 734   size_t n = strlen(s2);
 735   return strncmp(s1, s2, n);
 736 }
 737
 738 /** Compare the s1_len-byte string <b>s1</b> with <b>s2</b>,
 739  * without depending on a terminating nul in s1.  Sorting order is first by
 740  * length, then lexically; return values are as for strcmp.
 741  */
 742 int
 743 strcmp_len(const char *s1, const char *s2, size_t s1_len)
 744 {
 745   size_t s2_len = strlen(s2);
 746   if (s1_len < s2_len)
 747     return -1;
 748   if (s1_len > s2_len)
 749     return 1;
 750   return fast_memcmp(s1, s2, s2_len);
 751 }
 752
 753 /** Compares the first strlen(s2) characters of s1 with s2.  Returns as for
 754  * strcasecmp.
 755  */
 756 int
 757 strcasecmpstart(const char *s1, const char *s2)
 758 {
 759   size_t n = strlen(s2);
 760   return strncasecmp(s1, s2, n);
 761 }
 762
 763 /** Compares the last strlen(s2) characters of s1 with s2.  Returns as for
 764  * strcmp.
 765  */
 766 int
 767 strcmpend(const char *s1, const char *s2)
 768 {
 769   size_t n1 = strlen(s1), n2 = strlen(s2);
 770   if (n2>n1)
 771     return strcmp(s1,s2);
 772   else
 773     return strncmp(s1+(n1-n2), s2, n2);
 774 }
 775
 776 /** Compares the last strlen(s2) characters of s1 with s2.  Returns as for
 777  * strcasecmp.
 778  */
 779 int
 780 strcasecmpend(const char *s1, const char *s2)
 781 {
 782   size_t n1 = strlen(s1), n2 = strlen(s2);
 783   if (n2>n1) /* then they can't be the same; figure out which is bigger */
 784     return strcasecmp(s1,s2);
 785   else
 786     return strncasecmp(s1+(n1-n2), s2, n2);
 787 }
 788
 789 /** Compare the value of the string <b>prefix</b> with the start of the
 790  * <b>memlen</b>-byte memory chunk at <b>mem</b>.  Return as for strcmp.
 791  *
 792  * [As fast_memcmp(mem, prefix, strlen(prefix)) but returns -1 if memlen is
 793  * less than strlen(prefix).]
 794  */
 795 int
 796 fast_memcmpstart(const void *mem, size_t memlen,
 797                 const char *prefix)
 798 {
 799   size_t plen = strlen(prefix);
 800   if (memlen < plen)
 801     return -1;
 802   return fast_memcmp(mem, prefix, plen);
 803 }
 804
 805 /** Return a pointer to the first char of s that is not whitespace and
 806  * not a comment, or to the terminating NUL if no such character exists.
 807  */
 808 const char *
 809 eat_whitespace(const char *s)
 810 {
 811   tor_assert(s);
 812
 813   while (1) {
 814     switch (*s) {
 815     case '\0':
 816     default:
 817       return s;
 818     case ' ':
 819     case '\t':
 820     case '\n':
 821     case '\r':
 822       ++s;
 823       break;
 824     case '#':
 825       ++s;
 826       while (*s && *s != '\n')
 827         ++s;
 828     }
 829   }
 830 }
 831
 832 /** Return a pointer to the first char of s that is not whitespace and
 833  * not a comment, or to the terminating NUL if no such character exists.
 834  */
 835 const char *
 836 eat_whitespace_eos(const char *s, const char *eos)
 837 {
 838   tor_assert(s);
 839   tor_assert(eos && s <= eos);
 840
 841   while (s < eos) {
 842     switch (*s) {
 843     case '\0':
 844     default:
 845       return s;
 846     case ' ':
 847     case '\t':
 848     case '\n':
 849     case '\r':
 850       ++s;
 851       break;
 852     case '#':
 853       ++s;
 854       while (s < eos && *s && *s != '\n')
 855         ++s;
 856     }
 857   }
 858   return s;
 859 }
 860
 861 /** Return a pointer to the first char of s that is not a space or a tab
 862  * or a \\r, or to the terminating NUL if no such character exists. */
 863 const char *
 864 eat_whitespace_no_nl(const char *s)
 865 {
 866   while (*s == ' ' || *s == '\t' || *s == '\r')
 867     ++s;
 868   return s;
 869 }
 870
 871 /** As eat_whitespace_no_nl, but stop at <b>eos</b> whether we have
 872  * found a non-whitespace character or not. */
 873 const char *
 874 eat_whitespace_eos_no_nl(const char *s, const char *eos)
 875 {
 876   while (s < eos && (*s == ' ' || *s == '\t' || *s == '\r'))
 877     ++s;
 878   return s;
 879 }
 880
 881 /** Return a pointer to the first char of s that is whitespace or <b>#</b>,
 882  * or to the terminating NUL if no such character exists.
 883  */
 884 const char *
 885 find_whitespace(const char *s)
 886 {
 887   /* tor_assert(s); */
 888   while (1) {
 889     switch (*s)
 890     {
 891     case '\0':
 892     case '#':
 893     case ' ':
 894     case '\r':
 895     case '\n':
 896     case '\t':
 897       return s;
 898     default:
 899       ++s;
 900     }
 901   }
 902 }
 903
 904 /** As find_whitespace, but stop at <b>eos</b> whether we have found a
 905  * whitespace or not. */
 906 const char *
 907 find_whitespace_eos(const char *s, const char *eos)
 908 {
 909   /* tor_assert(s); */
 910   while (s < eos) {
 911     switch (*s)
 912     {
 913     case '\0':
 914     case '#':
 915     case ' ':
 916     case '\r':
 917     case '\n':
 918     case '\t':
 919       return s;
 920     default:
 921       ++s;
 922     }
 923   }
 924   return s;
 925 }
 926
 927 /** Return the first occurrence of <b>needle</b> in <b>haystack</b> that
 928  * occurs at the start of a line (that is, at the beginning of <b>haystack</b>
 929  * or immediately after a newline).  Return NULL if no such string is found.
 930  */
 931 const char *
 932 find_str_at_start_of_line(const char *haystack, const char *needle)
 933 {
 934   size_t needle_len = strlen(needle);
 935
 936   do {
 937     if (!strncmp(haystack, needle, needle_len))
 938       return haystack;
 939
 940     haystack = strchr(haystack, '\n');
 941     if (!haystack)
 942       return NULL;
 943     else
 944       ++haystack;
 945   } while (*haystack);
 946
 947   return NULL;
 948 }
 949
 950 /** Returns true if <b>string</b> could be a C identifier.
 951     A C identifier must begin with a letter or an underscore and the
 952     rest of its characters can be letters, numbers or underscores. No
 953     length limit is imposed. */
 954 int
 955 string_is_C_identifier(const char *string)
 956 {
 957   size_t iter;
 958   size_t length = strlen(string);
 959   if (!length)
 960     return 0;
 961
 962   for (iter = 0; iter < length ; iter++) {
 963     if (iter == 0) {
 964       if (!(TOR_ISALPHA(string[iter]) ||
 965             string[iter] == '_'))
 966         return 0;
 967     } else {
 968       if (!(TOR_ISALPHA(string[iter]) ||
 969             TOR_ISDIGIT(string[iter]) ||
 970             string[iter] == '_'))
 971         return 0;
 972     }
 973   }
 974
 975   return 1;
 976 }
 977
 978 /** Return true iff the 'len' bytes at 'mem' are all zero. */
 979 int
 980 tor_mem_is_zero(const char *mem, size_t len)
 981 {
 982   static const char ZERO[] = {
 983     0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
 984   };
 985   while (len >= sizeof(ZERO)) {
 986     /* It's safe to use fast_memcmp here, since the very worst thing an
 987      * attacker could learn is how many initial bytes of a secret were zero */
 988     if (fast_memcmp(mem, ZERO, sizeof(ZERO)))
 989       return 0;
 990     len -= sizeof(ZERO);
 991     mem += sizeof(ZERO);
 992   }
 993   /* Deal with leftover bytes. */
 994   if (len)
 995     return fast_memeq(mem, ZERO, len);
 996
 997   return 1;
 998 }
 999
1000 /** Return true iff the DIGEST_LEN bytes in digest are all zero. */
1001 int
1002 tor_digest_is_zero(const char *digest)
1003 {
1004   static const uint8_t ZERO_DIGEST[] = {
1005     0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0
1006   };
1007   return tor_memeq(digest, ZERO_DIGEST, DIGEST_LEN);
1008 }
1009
1010 /** Return true if <b>string</b> is a valid 'key=[value]' string.
1011  *  "value" is optional, to indicate the empty string. Log at logging
1012  *  <b>severity</b> if something ugly happens. */
1013 int
1014 string_is_key_value(int severity, const char *string)
1015 {
1016   /* position of equal sign in string */
1017   const char *equal_sign_pos = NULL;
1018
1019   tor_assert(string);
1020
1021   if (strlen(string) < 2) { /* "x=" is shortest args string */
1022     tor_log(severity, LD_GENERAL, "'%s' is too short to be a k=v value.",
1023             escaped(string));
1024     return 0;
1025   }
1026
1027   equal_sign_pos = strchr(string, '=');
1028   if (!equal_sign_pos) {
1029     tor_log(severity, LD_GENERAL, "'%s' is not a k=v value.", escaped(string));
1030     return 0;
1031   }
1032
1033   /* validate that the '=' is not in the beginning of the string. */
1034   if (equal_sign_pos == string) {
1035     tor_log(severity, LD_GENERAL, "'%s' is not a valid k=v value.",
1036             escaped(string));
1037     return 0;
1038   }
1039
1040   return 1;
1041 }
1042
1043 /** Return true if <b>string</b> represents a valid IPv4 adddress in
1044  * 'a.b.c.d' form.
1045  */
1046 int
1047 string_is_valid_ipv4_address(const char *string)
1048 {
1049   struct in_addr addr;
1050
1051   return (tor_inet_pton(AF_INET,string,&addr) == 1);
1052 }
1053
1054 /** Return true if <b>string</b> represents a valid IPv6 address in
1055  * a form that inet_pton() can parse.
1056  */
1057 int
1058 string_is_valid_ipv6_address(const char *string)
1059 {
1060   struct in6_addr addr;
1061
1062   return (tor_inet_pton(AF_INET6,string,&addr) == 1);
1063 }
1064
1065 /** Return true iff <b>string</b> matches a pattern of DNS names
1066  * that we allow Tor clients to connect to.
1067  *
1068  * Note: This allows certain technically invalid characters ('_') to cope
1069  * with misconfigured zones that have been encountered in the wild.
1070  */
1071 int
1072 string_is_valid_hostname(const char *string)
1073 {
1074   int result = 1;
1075   smartlist_t *components;
1076
1077   components = smartlist_new();
1078
1079   smartlist_split_string(components,string,".",0,0);
1080
1081   SMARTLIST_FOREACH_BEGIN(components, char *, c) {
1082     if ((c[0] == '-') || (*c == '_')) {
1083       result = 0;
1084       break;
1085     }
1086
1087     /* Allow a single terminating '.' used rarely to indicate domains
1088      * are FQDNs rather than relative. */
1089     if ((c_sl_idx > 0) && (c_sl_idx + 1 == c_sl_len) && !*c) {
1090       continue;
1091     }
1092
1093     do {
1094       if ((*c >= 'a' && *c <= 'z') ||
1095           (*c >= 'A' && *c <= 'Z') ||
1096           (*c >= '0' && *c <= '9') ||
1097           (*c == '-') || (*c == '_'))
1098         c++;
1099       else
1100         result = 0;
1101     } while (result && *c);
1102
1103   } SMARTLIST_FOREACH_END(c);
1104
1105   SMARTLIST_FOREACH_BEGIN(components, char *, c) {
1106     tor_free(c);
1107   } SMARTLIST_FOREACH_END(c);
1108
1109   smartlist_free(components);
1110
1111   return result;
1112 }
1113
1114 /** Return true iff the DIGEST256_LEN bytes in digest are all zero. */
1115 int
1116 tor_digest256_is_zero(const char *digest)
1117 {
1118   return tor_mem_is_zero(digest, DIGEST256_LEN);
1119 }
1120
1121 /* Helper: common code to check whether the result of a strtol or strtoul or
1122  * strtoll is correct. */
1123 #define CHECK_STRTOX_RESULT()                           \
1124   /* Did an overflow occur? */                          \
1125   if (errno == ERANGE)                                  \
1126     goto err;                                           \
1127   /* Was at least one character converted? */           \
1128   if (endptr == s)                                      \
1129     goto err;                                           \
1130   /* Were there unexpected unconverted characters? */   \
1131   if (!next && *endptr)                                 \
1132     goto err;                                           \
1133   /* Is r within limits? */                             \
1134   if (r < min || r > max)                               \
1135     goto err;                                           \
1136   if (ok) *ok = 1;                                      \
1137   if (next) *next = endptr;                             \
1138   return r;                                             \
1139  err:                                                   \
1140   if (ok) *ok = 0;                                      \
1141   if (next) *next = endptr;                             \
1142   return 0
1143
1144 /** Extract a long from the start of <b>s</b>, in the given numeric
1145  * <b>base</b>.  If <b>base</b> is 0, <b>s</b> is parsed as a decimal,
1146  * octal, or hex number in the syntax of a C integer literal.  If
1147  * there is unconverted data and <b>next</b> is provided, set
1148  * *<b>next</b> to the first unconverted character.  An error has
1149  * occurred if no characters are converted; or if there are
1150  * unconverted characters and <b>next</b> is NULL; or if the parsed
1151  * value is not between <b>min</b> and <b>max</b>.  When no error
1152  * occurs, return the parsed value and set *<b>ok</b> (if provided) to
1153  * 1.  When an error occurs, return 0 and set *<b>ok</b> (if provided)
1154  * to 0.
1155  */
1156 long
1157 tor_parse_long(const char *s, int base, long min, long max,
1158                int *ok, char **next)
1159 {
1160   char *endptr;
1161   long r;
1162
1163   if (base < 0) {
1164     if (ok)
1165       *ok = 0;
1166     return 0;
1167   }
1168
1169   errno = 0;
1170   r = strtol(s, &endptr, base);
1171   CHECK_STRTOX_RESULT();
1172 }
1173
1174 /** As tor_parse_long(), but return an unsigned long. */
1175 unsigned long
1176 tor_parse_ulong(const char *s, int base, unsigned long min,
1177                 unsigned long max, int *ok, char **next)
1178 {
1179   char *endptr;
1180   unsigned long r;
1181
1182   if (base < 0) {
1183     if (ok)
1184       *ok = 0;
1185     return 0;
1186   }
1187
1188   errno = 0;
1189   r = strtoul(s, &endptr, base);
1190   CHECK_STRTOX_RESULT();
1191 }
1192
1193 /** As tor_parse_long(), but return a double. */
1194 double
1195 tor_parse_double(const char *s, double min, double max, int *ok, char **next)
1196 {
1197   char *endptr;
1198   double r;
1199
1200   errno = 0;
1201   r = strtod(s, &endptr);
1202   CHECK_STRTOX_RESULT();
1203 }
1204
1205 /** As tor_parse_long, but return a uint64_t.  Only base 10 is guaranteed to
1206  * work for now. */
1207 uint64_t
1208 tor_parse_uint64(const char *s, int base, uint64_t min,
1209                  uint64_t max, int *ok, char **next)
1210 {
1211   char *endptr;
1212   uint64_t r;
1213
1214   if (base < 0) {
1215     if (ok)
1216       *ok = 0;
1217     return 0;
1218   }
1219
1220   errno = 0;
1221 #ifdef HAVE_STRTOULL
1222   r = (uint64_t)strtoull(s, &endptr, base);
1223 #elif defined(_WIN32)
1224 #if defined(_MSC_VER) && _MSC_VER < 1300
1225   tor_assert(base <= 10);
1226   r = (uint64_t)_atoi64(s);
1227   endptr = (char*)s;
1228   while (TOR_ISSPACE(*endptr)) endptr++;
1229   while (TOR_ISDIGIT(*endptr)) endptr++;
1230 #else
1231   r = (uint64_t)_strtoui64(s, &endptr, base);
1232 #endif
1233 #elif SIZEOF_LONG == 8
1234   r = (uint64_t)strtoul(s, &endptr, base);
1235 #else
1236 #error "I don't know how to parse 64-bit numbers."
1237 #endif
1238
1239   CHECK_STRTOX_RESULT();
1240 }
1241
1242 /** Allocate and return a new string representing the contents of <b>s</b>,
1243  * surrounded by quotes and using standard C escapes.
1244  *
1245  * Generally, we use this for logging values that come in over the network to
1246  * keep them from tricking users, and for sending certain values to the
1247  * controller.
1248  *
1249  * We trust values from the resolver, OS, configuration file, and command line
1250  * to not be maliciously ill-formed.  We validate incoming routerdescs and
1251  * SOCKS requests and addresses from BEGIN cells as they're parsed;
1252  * afterwards, we trust them as non-malicious.
1253  */
1254 char *
1255 esc_for_log(const char *s)
1256 {
1257   const char *cp;
1258   char *result, *outp;
1259   size_t len = 3;
1260   if (!s) {
1261     return tor_strdup("(null)");
1262   }
1263
1264   for (cp = s; *cp; ++cp) {
1265     switch (*cp) {
1266       case '\\':
1267       case '\"':
1268       case '\'':
1269       case '\r':
1270       case '\n':
1271       case '\t':
1272         len += 2;
1273         break;
1274       default:
1275         if (TOR_ISPRINT(*cp) && ((uint8_t)*cp)<127)
1276           ++len;
1277         else
1278           len += 4;
1279         break;
1280     }
1281   }
1282
1283   tor_assert(len <= SSIZE_MAX);
1284
1285   result = outp = tor_malloc(len);
1286   *outp++ = '\"';
1287   for (cp = s; *cp; ++cp) {
1288     /* This assertion should always succeed, since we will write at least
1289      * one char here, and two chars for closing quote and nul later */
1290     tor_assert((outp-result) < (ssize_t)len-2);
1291     switch (*cp) {
1292       case '\\':
1293       case '\"':
1294       case '\'':
1295         *outp++ = '\\';
1296         *outp++ = *cp;
1297         break;
1298       case '\n':
1299         *outp++ = '\\';
1300         *outp++ = 'n';
1301         break;
1302       case '\t':
1303         *outp++ = '\\';
1304         *outp++ = 't';
1305         break;
1306       case '\r':
1307         *outp++ = '\\';
1308         *outp++ = 'r';
1309         break;
1310       default:
1311         if (TOR_ISPRINT(*cp) && ((uint8_t)*cp)<127) {
1312           *outp++ = *cp;
1313         } else {
1314           tor_assert((outp-result) < (ssize_t)len-4);
1315           tor_snprintf(outp, 5, "\\%03o", (int)(uint8_t) *cp);
1316           outp += 4;
1317         }
1318         break;
1319     }
1320   }
1321
1322   tor_assert((outp-result) <= (ssize_t)len-2);
1323   *outp++ = '\"';
1324   *outp++ = 0;
1325
1326   return result;
1327 }
1328
1329 /** Similar to esc_for_log. Allocate and return a new string representing
1330  * the first n characters in <b>chars</b>, surround by quotes and using
1331  * standard C escapes. If a NUL character is encountered in <b>chars</b>,
1332  * the resulting string will be terminated there.
1333  */
1334 char *
1335 esc_for_log_len(const char *chars, size_t n)
1336 {
1337   char *string = tor_strndup(chars, n);
1338   char *string_escaped = esc_for_log(string);
1339   tor_free(string);
1340   return string_escaped;
1341 }
1342
1343 /** Allocate and return a new string representing the contents of <b>s</b>,
1344  * surrounded by quotes and using standard C escapes.
1345  *
1346  * THIS FUNCTION IS NOT REENTRANT.  Don't call it from outside the main
1347  * thread.  Also, each call invalidates the last-returned value, so don't
1348  * try log_warn(LD_GENERAL, "%s %s", escaped(a), escaped(b));
1349  */
1350 const char *
1351 escaped(const char *s)
1352 {
1353   static char *escaped_val_ = NULL;
1354   tor_free(escaped_val_);
1355
1356   if (s)
1357     escaped_val_ = esc_for_log(s);
1358   else
1359     escaped_val_ = NULL;
1360
1361   return escaped_val_;
1362 }
1363
1364 /** Return a newly allocated string equal to <b>string</b>, except that every
1365  * character in <b>chars_to_escape</b> is preceded by a backslash. */
1366 char *
1367 tor_escape_str_for_pt_args(const char *string, const char *chars_to_escape)
1368 {
1369   char *new_string = NULL;
1370   char *new_cp = NULL;
1371   size_t length, new_length;
1372
1373   tor_assert(string);
1374
1375   length = strlen(string);
1376
1377   if (!length) /* If we were given the empty string, return the same. */
1378     return tor_strdup("");
1379   /* (new_length > SIZE_MAX) => ((length * 2) + 1 > SIZE_MAX) =>
1380      (length*2 > SIZE_MAX - 1) => (length > (SIZE_MAX - 1)/2) */
1381   if (length > (SIZE_MAX - 1)/2) /* check for overflow */
1382     return NULL;
1383
1384   /* this should be enough even if all characters must be escaped */
1385   new_length = (length * 2) + 1;
1386
1387   new_string = new_cp = tor_malloc(new_length);
1388
1389   while (*string) {
1390     if (strchr(chars_to_escape, *string))
1391       *new_cp++ = '\\';
1392
1393     *new_cp++ = *string++;
1394   }
1395
1396   *new_cp = '\0'; /* NUL-terminate the new string */
1397
1398   return new_string;
1399 }
1400
1401 /* =====
1402  * Time
1403  * ===== */
1404
1405 /** Return the number of microseconds elapsed between *start and *end.
1406  */
1407 long
1408 tv_udiff(const struct timeval *start, const struct timeval *end)
1409 {
1410   long udiff;
1411   long secdiff = end->tv_sec - start->tv_sec;
1412
1413   if (labs(secdiff+1) > LONG_MAX/1000000) {
1414     log_warn(LD_GENERAL, "comparing times on microsecond detail too far "
1415              "apart: %ld seconds", secdiff);
1416     return LONG_MAX;
1417   }
1418
1419   udiff = secdiff*1000000L + (end->tv_usec - start->tv_usec);
1420   return udiff;
1421 }
1422
1423 /** Return the number of milliseconds elapsed between *start and *end.
1424  */
1425 long
1426 tv_mdiff(const struct timeval *start, const struct timeval *end)
1427 {
1428   long mdiff;
1429   long secdiff = end->tv_sec - start->tv_sec;
1430
1431   if (labs(secdiff+1) > LONG_MAX/1000) {
1432     log_warn(LD_GENERAL, "comparing times on millisecond detail too far "
1433              "apart: %ld seconds", secdiff);
1434     return LONG_MAX;
1435   }
1436
1437   /* Subtract and round */
1438   mdiff = secdiff*1000L +
1439       ((long)end->tv_usec - (long)start->tv_usec + 500L) / 1000L;
1440   return mdiff;
1441 }
1442
1443 /**
1444  * Converts timeval to milliseconds.
1445  */
1446 int64_t
1447 tv_to_msec(const struct timeval *tv)
1448 {
1449   int64_t conv = ((int64_t)tv->tv_sec)*1000L;
1450   /* Round ghetto-style */
1451   conv += ((int64_t)tv->tv_usec+500)/1000L;
1452   return conv;
1453 }
1454
1455 /** Yield true iff <b>y</b> is a leap-year. */
1456 #define IS_LEAPYEAR(y) (!(y % 4) && ((y % 100) || !(y % 400)))
1457 /** Helper: Return the number of leap-days between Jan 1, y1 and Jan 1, y2. */
1458 static int
1459 n_leapdays(int y1, int y2)
1460 {
1461   --y1;
1462   --y2;
1463   return (y2/4 - y1/4) - (y2/100 - y1/100) + (y2/400 - y1/400);
1464 }
1465 /** Number of days per month in non-leap year; used by tor_timegm and
1466  * parse_rfc1123_time. */
1467 static const int days_per_month[] =
1468   { 31, 28, 31, 30, 31, 30, 31, 31, 30, 31, 30, 31};
1469
1470 /** Compute a time_t given a struct tm.  The result is given in UTC, and
1471  * does not account for leap seconds.  Return 0 on success, -1 on failure.
1472  */
1473 int
1474 tor_timegm(const struct tm *tm, time_t *time_out)
1475 {
1476   /* This is a pretty ironclad timegm implementation, snarfed from Python2.2.
1477    * It's way more brute-force than fiddling with tzset().
1478    */
1479   time_t year, days, hours, minutes, seconds;
1480   int i, invalid_year, dpm;
1481   /* avoid int overflow on addition */
1482   if (tm->tm_year < INT32_MAX-1900) {
1483     year = tm->tm_year + 1900;
1484   } else {
1485     /* clamp year */
1486     year = INT32_MAX;
1487   }
1488   invalid_year = (year < 1970 || tm->tm_year >= INT32_MAX-1900);
1489
1490   if (tm->tm_mon >= 0 && tm->tm_mon <= 11) {
1491     dpm = days_per_month[tm->tm_mon];
1492     if (tm->tm_mon == 1 && !invalid_year && IS_LEAPYEAR(tm->tm_year)) {
1493       dpm = 29;
1494     }
1495   } else {
1496     /* invalid month - default to 0 days per month */
1497     dpm = 0;
1498   }
1499
1500   if (invalid_year ||
1501       tm->tm_mon < 0 || tm->tm_mon > 11 ||
1502       tm->tm_mday < 1 || tm->tm_mday > dpm ||
1503       tm->tm_hour < 0 || tm->tm_hour > 23 ||
1504       tm->tm_min < 0 || tm->tm_min > 59 ||
1505       tm->tm_sec < 0 || tm->tm_sec > 60) {
1506     log_warn(LD_BUG, "Out-of-range argument to tor_timegm");
1507     return -1;
1508   }
1509   days = 365 * (year-1970) + n_leapdays(1970,(int)year);
1510   for (i = 0; i < tm->tm_mon; ++i)
1511     days += days_per_month[i];
1512   if (tm->tm_mon > 1 && IS_LEAPYEAR(year))
1513     ++days;
1514   days += tm->tm_mday - 1;
1515   hours = days*24 + tm->tm_hour;
1516
1517   minutes = hours*60 + tm->tm_min;
1518   seconds = minutes*60 + tm->tm_sec;
1519   *time_out = seconds;
1520   return 0;
1521 }
1522
1523 /* strftime is locale-specific, so we need to replace those parts */
1524
1525 /** A c-locale array of 3-letter names of weekdays, starting with Sun. */
1526 static const char *WEEKDAY_NAMES[] =
1527   { "Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat" };
1528 /** A c-locale array of 3-letter names of months, starting with Jan. */
1529 static const char *MONTH_NAMES[] =
1530   { "Jan", "Feb", "Mar", "Apr", "May", "Jun",
1531     "Jul", "Aug", "Sep", "Oct", "Nov", "Dec" };
1532
1533 /** Set <b>buf</b> to the RFC1123 encoding of the UTC value of <b>t</b>.
1534  * The buffer must be at least RFC1123_TIME_LEN+1 bytes long.
1535  *
1536  * (RFC1123 format is "Fri, 29 Sep 2006 15:54:20 GMT". Note the "GMT"
1537  * rather than "UTC".)
1538  */
1539 void
1540 format_rfc1123_time(char *buf, time_t t)
1541 {
1542   struct tm tm;
1543
1544   tor_gmtime_r(&t, &tm);
1545
1546   strftime(buf, RFC1123_TIME_LEN+1, "___, %d ___ %Y %H:%M:%S GMT", &tm);
1547   tor_assert(tm.tm_wday >= 0);
1548   tor_assert(tm.tm_wday <= 6);
1549   memcpy(buf, WEEKDAY_NAMES[tm.tm_wday], 3);
1550   tor_assert(tm.tm_mon >= 0);
1551   tor_assert(tm.tm_mon <= 11);
1552   memcpy(buf+8, MONTH_NAMES[tm.tm_mon], 3);
1553 }
1554
1555 /** Parse the (a subset of) the RFC1123 encoding of some time (in UTC) from
1556  * <b>buf</b>, and store the result in *<b>t</b>.
1557  *
1558  * Note that we only accept the subset generated by format_rfc1123_time above,
1559  * not the full range of formats suggested by RFC 1123.
1560  *
1561  * Return 0 on success, -1 on failure.
1562 */
1563 int
1564 parse_rfc1123_time(const char *buf, time_t *t)
1565 {
1566   struct tm tm;
1567   char month[4];
1568   char weekday[4];
1569   int i, m, invalid_year;
1570   unsigned tm_mday, tm_year, tm_hour, tm_min, tm_sec;
1571   unsigned dpm;
1572
1573   if (strlen(buf) != RFC1123_TIME_LEN)
1574     return -1;
1575   memset(&tm, 0, sizeof(tm));
1576   if (tor_sscanf(buf, "%3s, %2u %3s %u %2u:%2u:%2u GMT", weekday,
1577              &tm_mday, month, &tm_year, &tm_hour,
1578              &tm_min, &tm_sec) < 7) {
1579     char *esc = esc_for_log(buf);
1580     log_warn(LD_GENERAL, "Got invalid RFC1123 time %s", esc);
1581     tor_free(esc);
1582     return -1;
1583   }
1584
1585   m = -1;
1586   for (i = 0; i < 12; ++i) {
1587     if (!strcmp(month, MONTH_NAMES[i])) {
1588       m = i;
1589       break;
1590     }
1591   }
1592   if (m<0) {
1593     char *esc = esc_for_log(buf);
1594     log_warn(LD_GENERAL, "Got invalid RFC1123 time %s: No such month", esc);
1595     tor_free(esc);
1596     return -1;
1597   }
1598   tm.tm_mon = m;
1599
1600   invalid_year = (tm_year >= INT32_MAX || tm_year < 1970);
1601   tor_assert(m >= 0 && m <= 11);
1602   dpm = days_per_month[m];
1603   if (m == 1 && !invalid_year && IS_LEAPYEAR(tm_year)) {
1604     dpm = 29;
1605   }
1606
1607   if (invalid_year || tm_mday < 1 || tm_mday > dpm ||
1608       tm_hour > 23 || tm_min > 59 || tm_sec > 60) {
1609     char *esc = esc_for_log(buf);
1610     log_warn(LD_GENERAL, "Got invalid RFC1123 time %s", esc);
1611     tor_free(esc);
1612     return -1;
1613   }
1614   tm.tm_mday = (int)tm_mday;
1615   tm.tm_year = (int)tm_year;
1616   tm.tm_hour = (int)tm_hour;
1617   tm.tm_min = (int)tm_min;
1618   tm.tm_sec = (int)tm_sec;
1619
1620   if (tm.tm_year < 1970) {
1621     char *esc = esc_for_log(buf);
1622     log_warn(LD_GENERAL,
1623              "Got invalid RFC1123 time %s. (Before 1970)", esc);
1624     tor_free(esc);
1625     return -1;
1626   }
1627   tm.tm_year -= 1900;
1628
1629   return tor_timegm(&tm, t);
1630 }
1631
1632 /** Set <b>buf</b> to the ISO8601 encoding of the local value of <b>t</b>.
1633  * The buffer must be at least ISO_TIME_LEN+1 bytes long.
1634  *
1635  * (ISO8601 format is 2006-10-29 10:57:20)
1636  */
1637 void
1638 format_local_iso_time(char *buf, time_t t)
1639 {
1640   struct tm tm;
1641   strftime(buf, ISO_TIME_LEN+1, "%Y-%m-%d %H:%M:%S", tor_localtime_r(&t, &tm));
1642 }
1643
1644 /** Set <b>buf</b> to the ISO8601 encoding of the GMT value of <b>t</b>.
1645  * The buffer must be at least ISO_TIME_LEN+1 bytes long.
1646  */
1647 void
1648 format_iso_time(char *buf, time_t t)
1649 {
1650   struct tm tm;
1651   strftime(buf, ISO_TIME_LEN+1, "%Y-%m-%d %H:%M:%S", tor_gmtime_r(&t, &tm));
1652 }
1653
1654 /** As format_iso_time, but use the yyyy-mm-ddThh:mm:ss format to avoid
1655  * embedding an internal space. */
1656 void
1657 format_iso_time_nospace(char *buf, time_t t)
1658 {
1659   format_iso_time(buf, t);
1660   buf[10] = 'T';
1661 }
1662
1663 /** As format_iso_time_nospace, but include microseconds in decimal
1664  * fixed-point format.  Requires that buf be at least ISO_TIME_USEC_LEN+1
1665  * bytes long. */
1666 void
1667 format_iso_time_nospace_usec(char *buf, const struct timeval *tv)
1668 {
1669   tor_assert(tv);
1670   format_iso_time_nospace(buf, (time_t)tv->tv_sec);
1671   tor_snprintf(buf+ISO_TIME_LEN, 8, ".%06d", (int)tv->tv_usec);
1672 }
1673
1674 /** Given an ISO-formatted UTC time value (after the epoch) in <b>cp</b>,
1675  * parse it and store its value in *<b>t</b>.  Return 0 on success, -1 on
1676  * failure.  Ignore extraneous stuff in <b>cp</b> after the end of the time
1677  * string, unless <b>strict</b> is set. */
1678 int
1679 parse_iso_time_(const char *cp, time_t *t, int strict)
1680 {
1681   struct tm st_tm;
1682   unsigned int year=0, month=0, day=0, hour=0, minute=0, second=0;
1683   int n_fields;
1684   char extra_char;
1685   n_fields = tor_sscanf(cp, "%u-%2u-%2u %2u:%2u:%2u%c", &year, &month,
1686                         &day, &hour, &minute, &second, &extra_char);
1687   if (strict ? (n_fields != 6) : (n_fields < 6)) {
1688     char *esc = esc_for_log(cp);
1689     log_warn(LD_GENERAL, "ISO time %s was unparseable", esc);
1690     tor_free(esc);
1691     return -1;
1692   }
1693   if (year < 1970 || month < 1 || month > 12 || day < 1 || day > 31 ||
1694           hour > 23 || minute > 59 || second > 60 || year >= INT32_MAX) {
1695     char *esc = esc_for_log(cp);
1696     log_warn(LD_GENERAL, "ISO time %s was nonsensical", esc);
1697     tor_free(esc);
1698     return -1;
1699   }
1700   st_tm.tm_year = (int)year-1900;
1701   st_tm.tm_mon = month-1;
1702   st_tm.tm_mday = day;
1703   st_tm.tm_hour = hour;
1704   st_tm.tm_min = minute;
1705   st_tm.tm_sec = second;
1706
1707   if (st_tm.tm_year < 70) {
1708     char *esc = esc_for_log(cp);
1709     log_warn(LD_GENERAL, "Got invalid ISO time %s. (Before 1970)", esc);
1710     tor_free(esc);
1711     return -1;
1712   }
1713   return tor_timegm(&st_tm, t);
1714 }
1715
1716 /** Given an ISO-formatted UTC time value (after the epoch) in <b>cp</b>,
1717  * parse it and store its value in *<b>t</b>.  Return 0 on success, -1 on
1718  * failure. Reject the string if any characters are present after the time.
1719  */
1720 int
1721 parse_iso_time(const char *cp, time_t *t)
1722 {
1723   return parse_iso_time_(cp, t, 1);
1724 }
1725
1726 /** Given a <b>date</b> in one of the three formats allowed by HTTP (ugh),
1727  * parse it into <b>tm</b>.  Return 0 on success, negative on failure. */
1728 int
1729 parse_http_time(const char *date, struct tm *tm)
1730 {
1731   const char *cp;
1732   char month[4];
1733   char wkday[4];
1734   int i;
1735   unsigned tm_mday, tm_year, tm_hour, tm_min, tm_sec;
1736
1737   tor_assert(tm);
1738   memset(tm, 0, sizeof(*tm));
1739
1740   /* First, try RFC1123 or RFC850 format: skip the weekday.  */
1741   if ((cp = strchr(date, ','))) {
1742     ++cp;
1743     if (*cp != ' ')
1744       return -1;
1745     ++cp;
1746     if (tor_sscanf(cp, "%2u %3s %4u %2u:%2u:%2u GMT",
1747                &tm_mday, month, &tm_year,
1748                &tm_hour, &tm_min, &tm_sec) == 6) {
1749       /* rfc1123-date */
1750       tm_year -= 1900;
1751     } else if (tor_sscanf(cp, "%2u-%3s-%2u %2u:%2u:%2u GMT",
1752                       &tm_mday, month, &tm_year,
1753                       &tm_hour, &tm_min, &tm_sec) == 6) {
1754       /* rfc850-date */
1755     } else {
1756       return -1;
1757     }
1758   } else {
1759     /* No comma; possibly asctime() format. */
1760     if (tor_sscanf(date, "%3s %3s %2u %2u:%2u:%2u %4u",
1761                wkday, month, &tm_mday,
1762                &tm_hour, &tm_min, &tm_sec, &tm_year) == 7) {
1763       tm_year -= 1900;
1764     } else {
1765       return -1;
1766     }
1767   }
1768   tm->tm_mday = (int)tm_mday;
1769   tm->tm_year = (int)tm_year;
1770   tm->tm_hour = (int)tm_hour;
1771   tm->tm_min = (int)tm_min;
1772   tm->tm_sec = (int)tm_sec;
1773
1774   month[3] = '\0';
1775   /* Okay, now decode the month. */
1776   /* set tm->tm_mon to dummy value so the check below fails. */
1777   tm->tm_mon = -1;
1778   for (i = 0; i < 12; ++i) {
1779     if (!strcasecmp(MONTH_NAMES[i], month)) {
1780       tm->tm_mon = i;
1781     }
1782   }
1783
1784   if (tm->tm_year < 0 ||
1785       tm->tm_mon < 0  || tm->tm_mon > 11 ||
1786       tm->tm_mday < 1 || tm->tm_mday > 31 ||
1787       tm->tm_hour < 0 || tm->tm_hour > 23 ||
1788       tm->tm_min < 0  || tm->tm_min > 59 ||
1789       tm->tm_sec < 0  || tm->tm_sec > 60)
1790     return -1; /* Out of range, or bad month. */
1791
1792   return 0;
1793 }
1794
1795 /** Given an <b>interval</b> in seconds, try to write it to the
1796  * <b>out_len</b>-byte buffer in <b>out</b> in a human-readable form.
1797  * Return 0 on success, -1 on failure.
1798  */
1799 int
1800 format_time_interval(char *out, size_t out_len, long interval)
1801 {
1802   /* We only report seconds if there's no hours. */
1803   long sec = 0, min = 0, hour = 0, day = 0;
1804
1805   /* -LONG_MIN is LONG_MAX + 1, which causes signed overflow */
1806   if (interval < -LONG_MAX)
1807     interval = LONG_MAX;
1808   else if (interval < 0)
1809     interval = -interval;
1810
1811   if (interval >= 86400) {
1812     day = interval / 86400;
1813     interval %= 86400;
1814   }
1815   if (interval >= 3600) {
1816     hour = interval / 3600;
1817     interval %= 3600;
1818   }
1819   if (interval >= 60) {
1820     min = interval / 60;
1821     interval %= 60;
1822   }
1823   sec = interval;
1824
1825   if (day) {
1826     return tor_snprintf(out, out_len, "%ld days, %ld hours, %ld minutes",
1827                         day, hour, min);
1828   } else if (hour) {
1829     return tor_snprintf(out, out_len, "%ld hours, %ld minutes", hour, min);
1830   } else if (min) {
1831     return tor_snprintf(out, out_len, "%ld minutes, %ld seconds", min, sec);
1832   } else {
1833     return tor_snprintf(out, out_len, "%ld seconds", sec);
1834   }
1835 }
1836
1837 /* =====
1838  * Cached time
1839  * ===== */
1840
1841 #ifndef TIME_IS_FAST
1842 /** Cached estimate of the current time.  Updated around once per second;
1843  * may be a few seconds off if we are really busy.  This is a hack to avoid
1844  * calling time(NULL) (which not everybody has optimized) on critical paths.
1845  */
1846 static time_t cached_approx_time = 0;
1847
1848 /** Return a cached estimate of the current time from when
1849  * update_approx_time() was last called.  This is a hack to avoid calling
1850  * time(NULL) on critical paths: please do not even think of calling it
1851  * anywhere else. */
1852 time_t
1853 approx_time(void)
1854 {
1855   return cached_approx_time;
1856 }
1857
1858 /** Update the cached estimate of the current time.  This function SHOULD be
1859  * called once per second, and MUST be called before the first call to
1860  * get_approx_time. */
1861 void
1862 update_approx_time(time_t now)
1863 {
1864   cached_approx_time = now;
1865 }
1866 #endif
1867
1868 /* =====
1869  * Rate limiting
1870  * ===== */
1871
1872 /** If the rate-limiter <b>lim</b> is ready at <b>now</b>, return the number
1873  * of calls to rate_limit_is_ready (including this one!) since the last time
1874  * rate_limit_is_ready returned nonzero.  Otherwise return 0. */
1875 static int
1876 rate_limit_is_ready(ratelim_t *lim, time_t now)
1877 {
1878   if (lim->rate + lim->last_allowed <= now) {
1879     int res = lim->n_calls_since_last_time + 1;
1880     lim->last_allowed = now;
1881     lim->n_calls_since_last_time = 0;
1882     return res;
1883   } else {
1884     ++lim->n_calls_since_last_time;
1885     return 0;
1886   }
1887 }
1888
1889 /** If the rate-limiter <b>lim</b> is ready at <b>now</b>, return a newly
1890  * allocated string indicating how many messages were suppressed, suitable to
1891  * append to a log message.  Otherwise return NULL. */
1892 char *
1893 rate_limit_log(ratelim_t *lim, time_t now)
1894 {
1895   int n;
1896   if ((n = rate_limit_is_ready(lim, now))) {
1897     if (n == 1) {
1898       return tor_strdup("");
1899     } else {
1900       char *cp=NULL;
1901       tor_asprintf(&cp,
1902                    " [%d similar message(s) suppressed in last %d seconds]",
1903                    n-1, lim->rate);
1904       return cp;
1905     }
1906   } else {
1907     return NULL;
1908   }
1909 }
1910
1911 /* =====
1912  * File helpers
1913  * ===== */
1914
1915 /** Write <b>count</b> bytes from <b>buf</b> to <b>fd</b>.  <b>isSocket</b>
1916  * must be 1 if fd was returned by socket() or accept(), and 0 if fd
1917  * was returned by open().  Return the number of bytes written, or -1
1918  * on error.  Only use if fd is a blocking fd.  */
1919 ssize_t
1920 write_all(tor_socket_t fd, const char *buf, size_t count, int isSocket)
1921 {
1922   size_t written = 0;
1923   ssize_t result;
1924   tor_assert(count < SSIZE_MAX);
1925
1926   while (written != count) {
1927     if (isSocket)
1928       result = tor_socket_send(fd, buf+written, count-written, 0);
1929     else
1930       result = write((int)fd, buf+written, count-written);
1931     if (result<0)
1932       return -1;
1933     written += result;
1934   }
1935   return (ssize_t)count;
1936 }
1937
1938 /** Read from <b>fd</b> to <b>buf</b>, until we get <b>count</b> bytes
1939  * or reach the end of the file. <b>isSocket</b> must be 1 if fd
1940  * was returned by socket() or accept(), and 0 if fd was returned by
1941  * open().  Return the number of bytes read, or -1 on error. Only use
1942  * if fd is a blocking fd. */
1943 ssize_t
1944 read_all(tor_socket_t fd, char *buf, size_t count, int isSocket)
1945 {
1946   size_t numread = 0;
1947   ssize_t result;
1948
1949   if (count > SIZE_T_CEILING || count > SSIZE_MAX) {
1950     errno = EINVAL;
1951     return -1;
1952   }
1953
1954   while (numread != count) {
1955     if (isSocket)
1956       result = tor_socket_recv(fd, buf+numread, count-numread, 0);
1957     else
1958       result = read((int)fd, buf+numread, count-numread);
1959     if (result<0)
1960       return -1;
1961     else if (result == 0)
1962       break;
1963     numread += result;
1964   }
1965   return (ssize_t)numread;
1966 }
1967
1968 /*
1969  *    Filesystem operations.
1970  */
1971
1972 /** Clean up <b>name</b> so that we can use it in a call to "stat".  On Unix,
1973  * we do nothing.  On Windows, we remove a trailing slash, unless the path is
1974  * the root of a disk. */
1975 static void
1976 clean_name_for_stat(char *name)
1977 {
1978 #ifdef _WIN32
1979   size_t len = strlen(name);
1980   if (!len)
1981     return;
1982   if (name[len-1]=='\\' || name[len-1]=='/') {
1983     if (len == 1 || (len==3 && name[1]==':'))
1984       return;
1985     name[len-1]='\0';
1986   }
1987 #else
1988   (void)name;
1989 #endif
1990 }
1991
1992 /** Return:
1993  * FN_ERROR if filename can't be read, is NULL, or is zero-length,
1994  * FN_NOENT if it doesn't exist,
1995  * FN_FILE if it is a non-empty regular file, or a FIFO on unix-like systems,
1996  * FN_EMPTY for zero-byte regular files,
1997  * FN_DIR if it's a directory, and
1998  * FN_ERROR for any other file type.
1999  * On FN_ERROR and FN_NOENT, sets errno.  (errno is not set when FN_ERROR
2000  * is returned due to an unhandled file type.) */
2001 file_status_t
2002 file_status(const char *fname)
2003 {
2004   struct stat st;
2005   char *f;
2006   int r;
2007   if (!fname || strlen(fname) == 0) {
2008     return FN_ERROR;
2009   }
2010   f = tor_strdup(fname);
2011   clean_name_for_stat(f);
2012   log_debug(LD_FS, "stat()ing %s", f);
2013   r = stat(sandbox_intern_string(f), &st);
2014   tor_free(f);
2015   if (r) {
2016     if (errno == ENOENT) {
2017       return FN_NOENT;
2018     }
2019     return FN_ERROR;
2020   }
2021   if (st.st_mode & S_IFDIR) {
2022     return FN_DIR;
2023   } else if (st.st_mode & S_IFREG) {
2024     if (st.st_size > 0) {
2025       return FN_FILE;
2026     } else if (st.st_size == 0) {
2027       return FN_EMPTY;
2028     } else {
2029       return FN_ERROR;
2030     }
2031 #ifndef _WIN32
2032   } else if (st.st_mode & S_IFIFO) {
2033     return FN_FILE;
2034 #endif
2035   } else {
2036     return FN_ERROR;
2037   }
2038 }
2039
2040 /** Check whether <b>dirname</b> exists and is private.  If yes return 0.  If
2041  * it does not exist, and <b>check</b>&CPD_CREATE is set, try to create it
2042  * and return 0 on success. If it does not exist, and
2043  * <b>check</b>&CPD_CHECK, and we think we can create it, return 0.  Else
2044  * return -1.  If CPD_GROUP_OK is set, then it's okay if the directory
2045  * is group-readable, but in all cases we create the directory mode 0700.
2046  * If CPD_GROUP_READ is set, existing directory behaves as CPD_GROUP_OK and
2047  * if the directory is created it will use mode 0750 with group read
2048  * permission. Group read privileges also assume execute permission
2049  * as norm for directories. If CPD_CHECK_MODE_ONLY is set, then we don't
2050  * alter the directory permissions if they are too permissive:
2051  * we just return -1.
2052  * When effective_user is not NULL, check permissions against the given user
2053  * and its primary group.
2054  */
2055 int
2056 check_private_dir(const char *dirname, cpd_check_t check,
2057                   const char *effective_user)
2058 {
2059   int r;
2060   struct stat st;
2061   char *f;
2062 #ifndef _WIN32
2063   unsigned unwanted_bits = 0;
2064   const struct passwd *pw = NULL;
2065   uid_t running_uid;
2066   gid_t running_gid;
2067 #else
2068   (void)effective_user;
2069 #endif
2070
2071   tor_assert(dirname);
2072   f = tor_strdup(dirname);
2073   clean_name_for_stat(f);
2074   log_debug(LD_FS, "stat()ing %s", f);
2075   r = stat(sandbox_intern_string(f), &st);
2076   tor_free(f);
2077   if (r) {
2078     if (errno != ENOENT) {
2079       log_warn(LD_FS, "Directory %s cannot be read: %s", dirname,
2080                strerror(errno));
2081       return -1;
2082     }
2083     if (check & CPD_CREATE) {
2084       log_info(LD_GENERAL, "Creating directory %s", dirname);
2085 #if defined (_WIN32)
2086       r = mkdir(dirname);
2087 #else
2088       if (check & CPD_GROUP_READ) {
2089         r = mkdir(dirname, 0750);
2090       } else {
2091         r = mkdir(dirname, 0700);
2092       }
2093 #endif
2094       if (r) {
2095         log_warn(LD_FS, "Error creating directory %s: %s", dirname,
2096             strerror(errno));
2097         return -1;
2098       }
2099     } else if (!(check & CPD_CHECK)) {
2100       log_warn(LD_FS, "Directory %s does not exist.", dirname);
2101       return -1;
2102     }
2103     /* XXXX In the case where check==CPD_CHECK, we should look at the
2104      * parent directory a little harder. */
2105     return 0;
2106   }
2107   if (!(st.st_mode & S_IFDIR)) {
2108     log_warn(LD_FS, "%s is not a directory", dirname);
2109     return -1;
2110   }
2111 #ifndef _WIN32
2112   if (effective_user) {
2113     /* Look up the user and group information.
2114      * If we have a problem, bail out. */
2115     pw = tor_getpwnam(effective_user);
2116     if (pw == NULL) {
2117       log_warn(LD_CONFIG, "Error setting configured user: %s not found",
2118                effective_user);
2119       return -1;
2120     }
2121     running_uid = pw->pw_uid;
2122     running_gid = pw->pw_gid;
2123   } else {
2124     running_uid = getuid();
2125     running_gid = getgid();
2126   }
2127
2128   if (st.st_uid != running_uid) {
2129     const struct passwd *pw = NULL;
2130     char *process_ownername = NULL;
2131
2132     pw = tor_getpwuid(running_uid);
2133     process_ownername = pw ? tor_strdup(pw->pw_name) : tor_strdup("<unknown>");
2134
2135     pw = tor_getpwuid(st.st_uid);
2136
2137     log_warn(LD_FS, "%s is not owned by this user (%s, %d) but by "
2138         "%s (%d). Perhaps you are running Tor as the wrong user?",
2139                          dirname, process_ownername, (int)running_uid,
2140                          pw ? pw->pw_name : "<unknown>", (int)st.st_uid);
2141
2142     tor_free(process_ownername);
2143     return -1;
2144   }
2145   if ( (check & (CPD_GROUP_OK|CPD_GROUP_READ))
2146        && (st.st_gid != running_gid) && (st.st_gid != 0)) {
2147     struct group *gr;
2148     char *process_groupname = NULL;
2149     gr = getgrgid(running_gid);
2150     process_groupname = gr ? tor_strdup(gr->gr_name) : tor_strdup("<unknown>");
2151     gr = getgrgid(st.st_gid);
2152
2153     log_warn(LD_FS, "%s is not owned by this group (%s, %d) but by group "
2154              "%s (%d).  Are you running Tor as the wrong user?",
2155              dirname, process_groupname, (int)running_gid,
2156              gr ?  gr->gr_name : "<unknown>", (int)st.st_gid);
2157
2158     tor_free(process_groupname);
2159     return -1;
2160   }
2161   if (check & (CPD_GROUP_OK|CPD_GROUP_READ)) {
2162     unwanted_bits = 0027;
2163   } else {
2164     unwanted_bits = 0077;
2165   }
2166   if ((st.st_mode & unwanted_bits) != 0) {
2167     unsigned new_mode;
2168     if (check & CPD_CHECK_MODE_ONLY) {
2169       log_warn(LD_FS, "Permissions on directory %s are too permissive.",
2170                dirname);
2171       return -1;
2172     }
2173     log_warn(LD_FS, "Fixing permissions on directory %s", dirname);
2174     new_mode = st.st_mode;
2175     new_mode |= 0700; /* Owner should have rwx */
2176     if (check & CPD_GROUP_READ) {
2177       new_mode |= 0050; /* Group should have rx */
2178     }
2179     new_mode &= ~unwanted_bits; /* Clear the bits that we didn't want set...*/
2180     if (chmod(dirname, new_mode)) {
2181       log_warn(LD_FS, "Could not chmod directory %s: %s", dirname,
2182                strerror(errno));
2183       return -1;
2184     } else {
2185       return 0;
2186     }
2187   }
2188 #endif
2189   return 0;
2190 }
2191
2192 /** Create a file named <b>fname</b> with the contents <b>str</b>.  Overwrite
2193  * the previous <b>fname</b> if possible.  Return 0 on success, -1 on failure.
2194  *
2195  * This function replaces the old file atomically, if possible.  This
2196  * function, and all other functions in util.c that create files, create them
2197  * with mode 0600.
2198  */
2199 int
2200 write_str_to_file(const char *fname, const char *str, int bin)
2201 {
2202 #ifdef _WIN32
2203   if (!bin && strchr(str, '\r')) {
2204     log_warn(LD_BUG,
2205              "We're writing a text string that already contains a CR to %s",
2206              escaped(fname));
2207   }
2208 #endif
2209   return write_bytes_to_file(fname, str, strlen(str), bin);
2210 }
2211
2212 /** Represents a file that we're writing to, with support for atomic commit:
2213  * we can write into a temporary file, and either remove the file on
2214  * failure, or replace the original file on success. */
2215 struct open_file_t {
2216   char *tempname; /**< Name of the temporary file. */
2217   char *filename; /**< Name of the original file. */
2218   unsigned rename_on_close:1; /**< Are we using the temporary file or not? */
2219   unsigned binary:1; /**< Did we open in binary mode? */
2220   int fd; /**< fd for the open file. */
2221   FILE *stdio_file; /**< stdio wrapper for <b>fd</b>. */
2222 };
2223
2224 /** Try to start writing to the file in <b>fname</b>, passing the flags
2225  * <b>open_flags</b> to the open() syscall, creating the file (if needed) with
2226  * access value <b>mode</b>.  If the O_APPEND flag is set, we append to the
2227  * original file.  Otherwise, we open a new temporary file in the same
2228  * directory, and either replace the original or remove the temporary file
2229  * when we're done.
2230  *
2231  * Return the fd for the newly opened file, and store working data in
2232  * *<b>data_out</b>.  The caller should not close the fd manually:
2233  * instead, call finish_writing_to_file() or abort_writing_to_file().
2234  * Returns -1 on failure.
2235  *
2236  * NOTE: When not appending, the flags O_CREAT and O_TRUNC are treated
2237  * as true and the flag O_EXCL is treated as false.
2238  *
2239  * NOTE: Ordinarily, O_APPEND means "seek to the end of the file before each
2240  * write()".  We don't do that.
2241  */
2242 int
2243 start_writing_to_file(const char *fname, int open_flags, int mode,
2244                       open_file_t **data_out)
2245 {
2246   open_file_t *new_file = tor_malloc_zero(sizeof(open_file_t));
2247   const char *open_name;
2248   int append = 0;
2249
2250   tor_assert(fname);
2251   tor_assert(data_out);
2252 #if (O_BINARY != 0 && O_TEXT != 0)
2253   tor_assert((open_flags & (O_BINARY|O_TEXT)) != 0);
2254 #endif
2255   new_file->fd = -1;
2256   new_file->filename = tor_strdup(fname);
2257   if (open_flags & O_APPEND) {
2258     open_name = fname;
2259     new_file->rename_on_close = 0;
2260     append = 1;
2261     open_flags &= ~O_APPEND;
2262   } else {
2263     tor_asprintf(&new_file->tempname, "%s.tmp", fname);
2264     open_name = new_file->tempname;
2265     /* We always replace an existing temporary file if there is one. */
2266     open_flags |= O_CREAT|O_TRUNC;
2267     open_flags &= ~O_EXCL;
2268     new_file->rename_on_close = 1;
2269   }
2270 #if O_BINARY != 0
2271   if (open_flags & O_BINARY)
2272     new_file->binary = 1;
2273 #endif
2274
2275   new_file->fd = tor_open_cloexec(open_name, open_flags, mode);
2276   if (new_file->fd < 0) {
2277     log_warn(LD_FS, "Couldn't open \"%s\" (%s) for writing: %s",
2278         open_name, fname, strerror(errno));
2279     goto err;
2280   }
2281   if (append) {
2282     if (tor_fd_seekend(new_file->fd) < 0) {
2283       log_warn(LD_FS, "Couldn't seek to end of file \"%s\": %s", open_name,
2284                strerror(errno));
2285       goto err;
2286     }
2287   }
2288
2289   *data_out = new_file;
2290
2291   return new_file->fd;
2292
2293  err:
2294   if (new_file->fd >= 0)
2295     close(new_file->fd);
2296   *data_out = NULL;
2297   tor_free(new_file->filename);
2298   tor_free(new_file->tempname);
2299   tor_free(new_file);
2300   return -1;
2301 }
2302
2303 /** Given <b>file_data</b> from start_writing_to_file(), return a stdio FILE*
2304  * that can be used to write to the same file.  The caller should not mix
2305  * stdio calls with non-stdio calls. */
2306 FILE *
2307 fdopen_file(open_file_t *file_data)
2308 {
2309   tor_assert(file_data);
2310   if (file_data->stdio_file)
2311     return file_data->stdio_file;
2312   tor_assert(file_data->fd >= 0);
2313   if (!(file_data->stdio_file = fdopen(file_data->fd,
2314                                        file_data->binary?"ab":"a"))) {
2315     log_warn(LD_FS, "Couldn't fdopen \"%s\" [%d]: %s", file_data->filename,
2316              file_data->fd, strerror(errno));
2317   }
2318   return file_data->stdio_file;
2319 }
2320
2321 /** Combines start_writing_to_file with fdopen_file(): arguments are as
2322  * for start_writing_to_file, but  */
2323 FILE *
2324 start_writing_to_stdio_file(const char *fname, int open_flags, int mode,
2325                             open_file_t **data_out)
2326 {
2327   FILE *res;
2328   if (start_writing_to_file(fname, open_flags, mode, data_out)<0)
2329     return NULL;
2330   if (!(res = fdopen_file(*data_out))) {
2331     abort_writing_to_file(*data_out);
2332     *data_out = NULL;
2333   }
2334   return res;
2335 }
2336
2337 /** Helper function: close and free the underlying file and memory in
2338  * <b>file_data</b>.  If we were writing into a temporary file, then delete
2339  * that file (if abort_write is true) or replaces the target file with
2340  * the temporary file (if abort_write is false). */
2341 static int
2342 finish_writing_to_file_impl(open_file_t *file_data, int abort_write)
2343 {
2344   int r = 0;
2345
2346   tor_assert(file_data && file_data->filename);
2347   if (file_data->stdio_file) {
2348     if (fclose(file_data->stdio_file)) {
2349       log_warn(LD_FS, "Error closing \"%s\": %s", file_data->filename,
2350                strerror(errno));
2351       abort_write = r = -1;
2352     }
2353   } else if (file_data->fd >= 0 && close(file_data->fd) < 0) {
2354     log_warn(LD_FS, "Error flushing \"%s\": %s", file_data->filename,
2355              strerror(errno));
2356     abort_write = r = -1;
2357   }
2358
2359   if (file_data->rename_on_close) {
2360     tor_assert(file_data->tempname && file_data->filename);
2361     if (abort_write) {
2362       int res = unlink(file_data->tempname);
2363       if (res != 0) {
2364         /* We couldn't unlink and we'll leave a mess behind */
2365         log_warn(LD_FS, "Failed to unlink %s: %s",
2366                  file_data->tempname, strerror(errno));
2367         r = -1;
2368       }
2369     } else {
2370       tor_assert(strcmp(file_data->filename, file_data->tempname));
2371       if (replace_file(file_data->tempname, file_data->filename)) {
2372         log_warn(LD_FS, "Error replacing \"%s\": %s", file_data->filename,
2373                  strerror(errno));
2374         r = -1;
2375       }
2376     }
2377   }
2378
2379   tor_free(file_data->filename);
2380   tor_free(file_data->tempname);
2381   tor_free(file_data);
2382
2383   return r;
2384 }
2385
2386 /** Finish writing to <b>file_data</b>: close the file handle, free memory as
2387  * needed, and if using a temporary file, replace the original file with
2388  * the temporary file. */
2389 int
2390 finish_writing_to_file(open_file_t *file_data)
2391 {
2392   return finish_writing_to_file_impl(file_data, 0);
2393 }
2394
2395 /** Finish writing to <b>file_data</b>: close the file handle, free memory as
2396  * needed, and if using a temporary file, delete it. */
2397 int
2398 abort_writing_to_file(open_file_t *file_data)
2399 {
2400   return finish_writing_to_file_impl(file_data, 1);
2401 }
2402
2403 /** Helper: given a set of flags as passed to open(2), open the file
2404  * <b>fname</b> and write all the sized_chunk_t structs in <b>chunks</b> to
2405  * the file.  Do so as atomically as possible e.g. by opening temp files and
2406  * renaming. */
2407 static int
2408 write_chunks_to_file_impl(const char *fname, const smartlist_t *chunks,
2409                           int open_flags)
2410 {
2411   open_file_t *file = NULL;
2412   int fd;
2413   ssize_t result;
2414   fd = start_writing_to_file(fname, open_flags, 0600, &file);
2415   if (fd<0)
2416     return -1;
2417   SMARTLIST_FOREACH(chunks, sized_chunk_t *, chunk,
2418   {
2419     result = write_all(fd, chunk->bytes, chunk->len, 0);
2420     if (result < 0) {
2421       log_warn(LD_FS, "Error writing to \"%s\": %s", fname,
2422           strerror(errno));
2423       goto err;
2424     }
2425     tor_assert((size_t)result == chunk->len);
2426   });
2427
2428   return finish_writing_to_file(file);
2429  err:
2430   abort_writing_to_file(file);
2431   return -1;
2432 }
2433
2434 /** Given a smartlist of sized_chunk_t, write them to a file
2435  * <b>fname</b>, overwriting or creating the file as necessary.
2436  * If <b>no_tempfile</b> is 0 then the file will be written
2437  * atomically. */
2438 int
2439 write_chunks_to_file(const char *fname, const smartlist_t *chunks, int bin,
2440                      int no_tempfile)
2441 {
2442   int flags = OPEN_FLAGS_REPLACE|(bin?O_BINARY:O_TEXT);
2443
2444   if (no_tempfile) {
2445     /* O_APPEND stops write_chunks_to_file from using tempfiles */
2446     flags |= O_APPEND;
2447   }
2448   return write_chunks_to_file_impl(fname, chunks, flags);
2449 }
2450
2451 /** Write <b>len</b> bytes, starting at <b>str</b>, to <b>fname</b>
2452     using the open() flags passed in <b>flags</b>. */
2453 static int
2454 write_bytes_to_file_impl(const char *fname, const char *str, size_t len,
2455                          int flags)
2456 {
2457   int r;
2458   sized_chunk_t c = { str, len };
2459   smartlist_t *chunks = smartlist_new();
2460   smartlist_add(chunks, &c);
2461   r = write_chunks_to_file_impl(fname, chunks, flags);
2462   smartlist_free(chunks);
2463   return r;
2464 }
2465
2466 /** As write_str_to_file, but does not assume a NUL-terminated
2467  * string. Instead, we write <b>len</b> bytes, starting at <b>str</b>. */
2468 MOCK_IMPL(int,
2469 write_bytes_to_file,(const char *fname, const char *str, size_t len,
2470                      int bin))
2471 {
2472   return write_bytes_to_file_impl(fname, str, len,
2473                                   OPEN_FLAGS_REPLACE|(bin?O_BINARY:O_TEXT));
2474 }
2475
2476 /** As write_bytes_to_file, but if the file already exists, append the bytes
2477  * to the end of the file instead of overwriting it. */
2478 int
2479 append_bytes_to_file(const char *fname, const char *str, size_t len,
2480                      int bin)
2481 {
2482   return write_bytes_to_file_impl(fname, str, len,
2483                                   OPEN_FLAGS_APPEND|(bin?O_BINARY:O_TEXT));
2484 }
2485
2486 /** Like write_str_to_file(), but also return -1 if there was a file
2487     already residing in <b>fname</b>. */
2488 int
2489 write_bytes_to_new_file(const char *fname, const char *str, size_t len,
2490                         int bin)
2491 {
2492   return write_bytes_to_file_impl(fname, str, len,
2493                                   OPEN_FLAGS_DONT_REPLACE|
2494                                   (bin?O_BINARY:O_TEXT));
2495 }
2496
2497 /**
2498  * Read the contents of the open file <b>fd</b> presuming it is a FIFO
2499  * (or similar) file descriptor for which the size of the file isn't
2500  * known ahead of time. Return NULL on failure, and a NUL-terminated
2501  * string on success.  On success, set <b>sz_out</b> to the number of
2502  * bytes read.
2503  */
2504 char *
2505 read_file_to_str_until_eof(int fd, size_t max_bytes_to_read, size_t *sz_out)
2506 {
2507   ssize_t r;
2508   size_t pos = 0;
2509   char *string = NULL;
2510   size_t string_max = 0;
2511
2512   if (max_bytes_to_read+1 >= SIZE_T_CEILING) {
2513     errno = EINVAL;
2514     return NULL;
2515   }
2516
2517   do {
2518     /* XXXX This "add 1K" approach is a little goofy; if we care about
2519      * performance here, we should be doubling.  But in practice we shouldn't
2520      * be using this function on big files anyway. */
2521     string_max = pos + 1024;
2522     if (string_max > max_bytes_to_read)
2523       string_max = max_bytes_to_read + 1;
2524     string = tor_realloc(string, string_max);
2525     r = read(fd, string + pos, string_max - pos - 1);
2526     if (r < 0) {
2527       int save_errno = errno;
2528       tor_free(string);
2529       errno = save_errno;
2530       return NULL;
2531     }
2532
2533     pos += r;
2534   } while (r > 0 && pos < max_bytes_to_read);
2535
2536   tor_assert(pos < string_max);
2537   *sz_out = pos;
2538   string[pos] = '\0';
2539   return string;
2540 }
2541
2542 /** Read the contents of <b>filename</b> into a newly allocated
2543  * string; return the string on success or NULL on failure.
2544  *
2545  * If <b>stat_out</b> is provided, store the result of stat()ing the
2546  * file into <b>stat_out</b>.
2547  *
2548  * If <b>flags</b> &amp; RFTS_BIN, open the file in binary mode.
2549  * If <b>flags</b> &amp; RFTS_IGNORE_MISSING, don't warn if the file
2550  * doesn't exist.
2551  */
2552 /*
2553  * This function <em>may</em> return an erroneous result if the file
2554  * is modified while it is running, but must not crash or overflow.
2555  * Right now, the error case occurs when the file length grows between
2556  * the call to stat and the call to read_all: the resulting string will
2557  * be truncated.
2558  */
2559 char *
2560 read_file_to_str(const char *filename, int flags, struct stat *stat_out)
2561 {
2562   int fd; /* router file */
2563   struct stat statbuf;
2564   char *string;
2565   ssize_t r;
2566   int bin = flags & RFTS_BIN;
2567
2568   tor_assert(filename);
2569
2570   fd = tor_open_cloexec(filename,O_RDONLY|(bin?O_BINARY:O_TEXT),0);
2571   if (fd<0) {
2572     int severity = LOG_WARN;
2573     int save_errno = errno;
2574     if (errno == ENOENT && (flags & RFTS_IGNORE_MISSING))
2575       severity = LOG_INFO;
2576     log_fn(severity, LD_FS,"Could not open \"%s\": %s",filename,
2577            strerror(errno));
2578     errno = save_errno;
2579     return NULL;
2580   }
2581
2582   if (fstat(fd, &statbuf)<0) {
2583     int save_errno = errno;
2584     close(fd);
2585     log_warn(LD_FS,"Could not fstat \"%s\".",filename);
2586     errno = save_errno;
2587     return NULL;
2588   }
2589
2590 #ifndef _WIN32
2591 /** When we detect that we're reading from a FIFO, don't read more than
2592  * this many bytes.  It's insane overkill for most uses. */
2593 #define FIFO_READ_MAX (1024*1024)
2594   if (S_ISFIFO(statbuf.st_mode)) {
2595     size_t sz = 0;
2596     string = read_file_to_str_until_eof(fd, FIFO_READ_MAX, &sz);
2597     int save_errno = errno;
2598     if (string && stat_out) {
2599       statbuf.st_size = sz;
2600       memcpy(stat_out, &statbuf, sizeof(struct stat));
2601     }
2602     close(fd);
2603     if (!string)
2604       errno = save_errno;
2605     return string;
2606   }
2607 #endif
2608
2609   if ((uint64_t)(statbuf.st_size)+1 >= SIZE_T_CEILING) {
2610     close(fd);
2611     errno = EINVAL;
2612     return NULL;
2613   }
2614
2615   string = tor_malloc((size_t)(statbuf.st_size+1));
2616
2617   r = read_all(fd,string,(size_t)statbuf.st_size,0);
2618   if (r<0) {
2619     int save_errno = errno;
2620     log_warn(LD_FS,"Error reading from file \"%s\": %s", filename,
2621              strerror(errno));
2622     tor_free(string);
2623     close(fd);
2624     errno = save_errno;
2625     return NULL;
2626   }
2627   string[r] = '\0'; /* NUL-terminate the result. */
2628
2629 #if defined(_WIN32) || defined(__CYGWIN__)
2630   if (!bin && strchr(string, '\r')) {
2631     log_debug(LD_FS, "We didn't convert CRLF to LF as well as we hoped "
2632               "when reading %s. Coping.",
2633               filename);
2634     tor_strstrip(string, "\r");
2635     r = strlen(string);
2636   }
2637   if (!bin) {
2638     statbuf.st_size = (size_t) r;
2639   } else
2640 #endif
2641     if (r != statbuf.st_size) {
2642       /* Unless we're using text mode on win32, we'd better have an exact
2643        * match for size. */
2644       int save_errno = errno;
2645       log_warn(LD_FS,"Could read only %d of %ld bytes of file \"%s\".",
2646                (int)r, (long)statbuf.st_size,filename);
2647       tor_free(string);
2648       close(fd);
2649       errno = save_errno;
2650       return NULL;
2651     }
2652   close(fd);
2653   if (stat_out) {
2654     memcpy(stat_out, &statbuf, sizeof(struct stat));
2655   }
2656
2657   return string;
2658 }
2659
2660 #define TOR_ISODIGIT(c) ('0' <= (c) && (c) <= '7')
2661
2662 /** Given a c-style double-quoted escaped string in <b>s</b>, extract and
2663  * decode its contents into a newly allocated string.  On success, assign this
2664  * string to *<b>result</b>, assign its length to <b>size_out</b> (if
2665  * provided), and return a pointer to the position in <b>s</b> immediately
2666  * after the string.  On failure, return NULL.
2667  */
2668 static const char *
2669 unescape_string(const char *s, char **result, size_t *size_out)
2670 {
2671   const char *cp;
2672   char *out;
2673   if (s[0] != '\"')
2674     return NULL;
2675   cp = s+1;
2676   while (1) {
2677     switch (*cp) {
2678       case '\0':
2679       case '\n':
2680         return NULL;
2681       case '\"':
2682         goto end_of_loop;
2683       case '\\':
2684         if (cp[1] == 'x' || cp[1] == 'X') {
2685           if (!(TOR_ISXDIGIT(cp[2]) && TOR_ISXDIGIT(cp[3])))
2686             return NULL;
2687           cp += 4;
2688         } else if (TOR_ISODIGIT(cp[1])) {
2689           cp += 2;
2690           if (TOR_ISODIGIT(*cp)) ++cp;
2691           if (TOR_ISODIGIT(*cp)) ++cp;
2692         } else if (cp[1] == 'n' || cp[1] == 'r' || cp[1] == 't' || cp[1] == '"'
2693                    || cp[1] == '\\' || cp[1] == '\'') {
2694           cp += 2;
2695         } else {
2696           return NULL;
2697         }
2698         break;
2699       default:
2700         ++cp;
2701         break;
2702     }
2703   }
2704  end_of_loop:
2705   out = *result = tor_malloc(cp-s + 1);
2706   cp = s+1;
2707   while (1) {
2708     switch (*cp)
2709       {
2710       case '\"':
2711         *out = '\0';
2712         if (size_out) *size_out = out - *result;
2713         return cp+1;
2714       case '\0':
2715         tor_fragile_assert();
2716         tor_free(*result);
2717         return NULL;
2718       case '\\':
2719         switch (cp[1])
2720           {
2721           case 'n': *out++ = '\n'; cp += 2; break;
2722           case 'r': *out++ = '\r'; cp += 2; break;
2723           case 't': *out++ = '\t'; cp += 2; break;
2724           case 'x': case 'X':
2725             {
2726               int x1, x2;
2727
2728               x1 = hex_decode_digit(cp[2]);
2729               x2 = hex_decode_digit(cp[3]);
2730               if (x1 == -1 || x2 == -1) {
2731                   tor_free(*result);
2732                   return NULL;
2733               }
2734
2735               *out++ = ((x1<<4) + x2);
2736               cp += 4;
2737             }
2738             break;
2739           case '0': case '1': case '2': case '3': case '4': case '5':
2740           case '6': case '7':
2741             {
2742               int n = cp[1]-'0';
2743               cp += 2;
2744               if (TOR_ISODIGIT(*cp)) { n = n*8 + *cp-'0'; cp++; }
2745               if (TOR_ISODIGIT(*cp)) { n = n*8 + *cp-'0'; cp++; }
2746               if (n > 255) { tor_free(*result); return NULL; }
2747               *out++ = (char)n;
2748             }
2749             break;
2750           case '\'':
2751           case '\"':
2752           case '\\':
2753           case '\?':
2754             *out++ = cp[1];
2755             cp += 2;
2756             break;
2757           default:
2758             tor_free(*result); return NULL;
2759           }
2760         break;
2761       default:
2762         *out++ = *cp++;
2763       }
2764   }
2765 }
2766
2767 /** Given a string containing part of a configuration file or similar format,
2768  * advance past comments and whitespace and try to parse a single line.  If we
2769  * parse a line successfully, set *<b>key_out</b> to a new string holding the
2770  * key portion and *<b>value_out</b> to a new string holding the value portion
2771  * of the line, and return a pointer to the start of the next line.  If we run
2772  * out of data, return a pointer to the end of the string.  If we encounter an
2773  * error, return NULL and set *<b>err_out</b> (if provided) to an error
2774  * message.
2775  */
2776 const char *
2777 parse_config_line_from_str_verbose(const char *line, char **key_out,
2778                                    char **value_out,
2779                                    const char **err_out)
2780 {
2781   /*
2782     See torrc_format.txt for a description of the (silly) format this parses.
2783    */
2784   const char *key, *val, *cp;
2785   int continuation = 0;
2786
2787   tor_assert(key_out);
2788   tor_assert(value_out);
2789
2790   *key_out = *value_out = NULL;
2791   key = val = NULL;
2792   /* Skip until the first keyword. */
2793   while (1) {
2794     while (TOR_ISSPACE(*line))
2795       ++line;
2796     if (*line == '#') {
2797       while (*line && *line != '\n')
2798         ++line;
2799     } else {
2800       break;
2801     }
2802   }
2803
2804   if (!*line) { /* End of string? */
2805     *key_out = *value_out = NULL;
2806     return line;
2807   }
2808
2809   /* Skip until the next space or \ followed by newline. */
2810   key = line;
2811   while (*line && !TOR_ISSPACE(*line) && *line != '#' &&
2812          ! (line[0] == '\\' && line[1] == '\n'))
2813     ++line;
2814   *key_out = tor_strndup(key, line-key);
2815
2816   /* Skip until the value. */
2817   while (*line == ' ' || *line == '\t')
2818     ++line;
2819
2820   val = line;
2821
2822   /* Find the end of the line. */
2823   if (*line == '\"') { // XXX No continuation handling is done here
2824     if (!(line = unescape_string(line, value_out, NULL))) {
2825       if (err_out)
2826         *err_out = "Invalid escape sequence in quoted string";
2827       return NULL;
2828     }
2829     while (*line == ' ' || *line == '\t')
2830       ++line;
2831     if (*line && *line != '#' && *line != '\n') {
2832       if (err_out)
2833         *err_out = "Excess data after quoted string";
2834       return NULL;
2835     }
2836   } else {
2837     /* Look for the end of the line. */
2838     while (*line && *line != '\n' && (*line != '#' || continuation)) {
2839       if (*line == '\\' && line[1] == '\n') {
2840         continuation = 1;
2841         line += 2;
2842       } else if (*line == '#') {
2843         do {
2844           ++line;
2845         } while (*line && *line != '\n');
2846         if (*line == '\n')
2847           ++line;
2848       } else {
2849         ++line;
2850       }
2851     }
2852
2853     if (*line == '\n') {
2854       cp = line++;
2855     } else {
2856       cp = line;
2857     }
2858     /* Now back cp up to be the last nonspace character */
2859     while (cp>val && TOR_ISSPACE(*(cp-1)))
2860       --cp;
2861
2862     tor_assert(cp >= val);
2863
2864     /* Now copy out and decode the value. */
2865     *value_out = tor_strndup(val, cp-val);
2866     if (continuation) {
2867       char *v_out, *v_in;
2868       v_out = v_in = *value_out;
2869       while (*v_in) {
2870         if (*v_in == '#') {
2871           do {
2872             ++v_in;
2873           } while (*v_in && *v_in != '\n');
2874           if (*v_in == '\n')
2875             ++v_in;
2876         } else if (v_in[0] == '\\' && v_in[1] == '\n') {
2877           v_in += 2;
2878         } else {
2879           *v_out++ = *v_in++;
2880         }
2881       }
2882       *v_out = '\0';
2883     }
2884   }
2885
2886   if (*line == '#') {
2887     do {
2888       ++line;
2889     } while (*line && *line != '\n');
2890   }
2891   while (TOR_ISSPACE(*line)) ++line;
2892
2893   return line;
2894 }
2895
2896 /** Expand any homedir prefix on <b>filename</b>; return a newly allocated
2897  * string. */
2898 char *
2899 expand_filename(const char *filename)
2900 {
2901   tor_assert(filename);
2902 #ifdef _WIN32
2903   return tor_strdup(filename);
2904 #else
2905   if (*filename == '~') {
2906     char *home, *result=NULL;
2907     const char *rest;
2908
2909     if (filename[1] == '/' || filename[1] == '\0') {
2910       home = getenv("HOME");
2911       if (!home) {
2912         log_warn(LD_CONFIG, "Couldn't find $HOME environment variable while "
2913                  "expanding \"%s\"; defaulting to \"\".", filename);
2914         home = tor_strdup("");
2915       } else {
2916         home = tor_strdup(home);
2917       }
2918       rest = strlen(filename)>=2?(filename+2):"";
2919     } else {
2920 #ifdef HAVE_PWD_H
2921       char *username, *slash;
2922       slash = strchr(filename, '/');
2923       if (slash)
2924         username = tor_strndup(filename+1,slash-filename-1);
2925       else
2926         username = tor_strdup(filename+1);
2927       if (!(home = get_user_homedir(username))) {
2928         log_warn(LD_CONFIG,"Couldn't get homedir for \"%s\"",username);
2929         tor_free(username);
2930         return NULL;
2931       }
2932       tor_free(username);
2933       rest = slash ? (slash+1) : "";
2934 #else
2935       log_warn(LD_CONFIG, "Couldn't expand homedir on system without pwd.h");
2936       return tor_strdup(filename);
2937 #endif
2938     }
2939     tor_assert(home);
2940     /* Remove trailing slash. */
2941     if (strlen(home)>1 && !strcmpend(home,PATH_SEPARATOR)) {
2942       home[strlen(home)-1] = '\0';
2943     }
2944     tor_asprintf(&result,"%s"PATH_SEPARATOR"%s",home,rest);
2945     tor_free(home);
2946     return result;
2947   } else {
2948     return tor_strdup(filename);
2949   }
2950 #endif
2951 }
2952
2953 #define MAX_SCANF_WIDTH 9999
2954
2955 /** Helper: given an ASCII-encoded decimal digit, return its numeric value.
2956  * NOTE: requires that its input be in-bounds. */
2957 static int
2958 digit_to_num(char d)
2959 {
2960   int num = ((int)d) - (int)'0';
2961   tor_assert(num <= 9 && num >= 0);
2962   return num;
2963 }
2964
2965 /** Helper: Read an unsigned int from *<b>bufp</b> of up to <b>width</b>
2966  * characters.  (Handle arbitrary width if <b>width</b> is less than 0.)  On
2967  * success, store the result in <b>out</b>, advance bufp to the next
2968  * character, and return 0.  On failure, return -1. */
2969 static int
2970 scan_unsigned(const char **bufp, unsigned long *out, int width, int base)
2971 {
2972   unsigned long result = 0;
2973   int scanned_so_far = 0;
2974   const int hex = base==16;
2975   tor_assert(base == 10 || base == 16);
2976   if (!bufp || !*bufp || !out)
2977     return -1;
2978   if (width<0)
2979     width=MAX_SCANF_WIDTH;
2980
2981   while (**bufp && (hex?TOR_ISXDIGIT(**bufp):TOR_ISDIGIT(**bufp))
2982          && scanned_so_far < width) {
2983     int digit = hex?hex_decode_digit(*(*bufp)++):digit_to_num(*(*bufp)++);
2984     // Check for overflow beforehand, without actually causing any overflow
2985     // This preserves functionality on compilers that don't wrap overflow
2986     // (i.e. that trap or optimise away overflow)
2987     // result * base + digit > ULONG_MAX
2988     // result * base > ULONG_MAX - digit
2989     if (result > (ULONG_MAX - digit)/base)
2990       return -1; /* Processing this digit would overflow */
2991     result = result * base + digit;
2992     ++scanned_so_far;
2993   }
2994
2995   if (!scanned_so_far) /* No actual digits scanned */
2996     return -1;
2997
2998   *out = result;
2999   return 0;
3000 }
3001
3002 /** Helper: Read an signed int from *<b>bufp</b> of up to <b>width</b>
3003  * characters.  (Handle arbitrary width if <b>width</b> is less than 0.)  On
3004  * success, store the result in <b>out</b>, advance bufp to the next
3005  * character, and return 0.  On failure, return -1. */
3006 static int
3007 scan_signed(const char **bufp, long *out, int width)
3008 {
3009   int neg = 0;
3010   unsigned long result = 0;
3011
3012   if (!bufp || !*bufp || !out)
3013     return -1;
3014   if (width<0)
3015     width=MAX_SCANF_WIDTH;
3016
3017   if (**bufp == '-') {
3018     neg = 1;
3019     ++*bufp;
3020     --width;
3021   }
3022
3023   if (scan_unsigned(bufp, &result, width, 10) < 0)
3024     return -1;
3025
3026   if (neg && result > 0) {
3027     if (result > ((unsigned long)LONG_MAX) + 1)
3028       return -1; /* Underflow */
3029     // Avoid overflow on the cast to signed long when result is LONG_MIN
3030     // by subtracting 1 from the unsigned long positive value,
3031     // then, after it has been cast to signed and negated,
3032     // subtracting the original 1 (the double-subtraction is intentional).
3033     // Otherwise, the cast to signed could cause a temporary long
3034     // to equal LONG_MAX + 1, which is undefined.
3035     // We avoid underflow on the subtraction by treating -0 as positive.
3036     *out = (-(long)(result - 1)) - 1;
3037   } else {
3038     if (result > LONG_MAX)
3039       return -1; /* Overflow */
3040     *out = (long)result;
3041   }
3042
3043   return 0;
3044 }
3045
3046 /** Helper: Read a decimal-formatted double from *<b>bufp</b> of up to
3047  * <b>width</b> characters.  (Handle arbitrary width if <b>width</b> is less
3048  * than 0.)  On success, store the result in <b>out</b>, advance bufp to the
3049  * next character, and return 0.  On failure, return -1. */
3050 static int
3051 scan_double(const char **bufp, double *out, int width)
3052 {
3053   int neg = 0;
3054   double result = 0;
3055   int scanned_so_far = 0;
3056
3057   if (!bufp || !*bufp || !out)
3058     return -1;
3059   if (width<0)
3060     width=MAX_SCANF_WIDTH;
3061
3062   if (**bufp == '-') {
3063     neg = 1;
3064     ++*bufp;
3065   }
3066
3067   while (**bufp && TOR_ISDIGIT(**bufp) && scanned_so_far < width) {
3068     const int digit = digit_to_num(*(*bufp)++);
3069     result = result * 10 + digit;
3070     ++scanned_so_far;
3071   }
3072   if (**bufp == '.') {
3073     double fracval = 0, denominator = 1;
3074     ++*bufp;
3075     ++scanned_so_far;
3076     while (**bufp && TOR_ISDIGIT(**bufp) && scanned_so_far < width) {
3077       const int digit = digit_to_num(*(*bufp)++);
3078       fracval = fracval * 10 + digit;
3079       denominator *= 10;
3080       ++scanned_so_far;
3081     }
3082     result += fracval / denominator;
3083   }
3084
3085   if (!scanned_so_far) /* No actual digits scanned */
3086     return -1;
3087
3088   *out = neg ? -result : result;
3089   return 0;
3090 }
3091
3092 /** Helper: copy up to <b>width</b> non-space characters from <b>bufp</b> to
3093  * <b>out</b>.  Make sure <b>out</b> is nul-terminated. Advance <b>bufp</b>
3094  * to the next non-space character or the EOS. */
3095 static int
3096 scan_string(const char **bufp, char *out, int width)
3097 {
3098   int scanned_so_far = 0;
3099   if (!bufp || !out || width < 0)
3100     return -1;
3101   while (**bufp && ! TOR_ISSPACE(**bufp) && scanned_so_far < width) {
3102     *out++ = *(*bufp)++;
3103     ++scanned_so_far;
3104   }
3105   *out = '\0';
3106   return 0;
3107 }
3108
3109 /** Locale-independent, minimal, no-surprises scanf variant, accepting only a
3110  * restricted pattern format.  For more info on what it supports, see
3111  * tor_sscanf() documentation.  */
3112 int
3113 tor_vsscanf(const char *buf, const char *pattern, va_list ap)
3114 {
3115   int n_matched = 0;
3116
3117   while (*pattern) {
3118     if (*pattern != '%') {
3119       if (*buf == *pattern) {
3120         ++buf;
3121         ++pattern;
3122         continue;
3123       } else {
3124         return n_matched;
3125       }
3126     } else {
3127       int width = -1;
3128       int longmod = 0;
3129       ++pattern;
3130       if (TOR_ISDIGIT(*pattern)) {
3131         width = digit_to_num(*pattern++);
3132         while (TOR_ISDIGIT(*pattern)) {
3133           width *= 10;
3134           width += digit_to_num(*pattern++);
3135           if (width > MAX_SCANF_WIDTH)
3136             return -1;
3137         }
3138         if (!width) /* No zero-width things. */
3139           return -1;
3140       }
3141       if (*pattern == 'l') {
3142         longmod = 1;
3143         ++pattern;
3144       }
3145       if (*pattern == 'u' || *pattern == 'x') {
3146         unsigned long u;
3147         const int base = (*pattern == 'u') ? 10 : 16;
3148         if (!*buf)
3149           return n_matched;
3150         if (scan_unsigned(&buf, &u, width, base)<0)
3151           return n_matched;
3152         if (longmod) {
3153           unsigned long *out = va_arg(ap, unsigned long *);
3154           *out = u;
3155         } else {
3156           unsigned *out = va_arg(ap, unsigned *);
3157           if (u > UINT_MAX)
3158             return n_matched;
3159           *out = (unsigned) u;
3160         }
3161         ++pattern;
3162         ++n_matched;
3163       } else if (*pattern == 'f') {
3164         double *d = va_arg(ap, double *);
3165         if (!longmod)
3166           return -1; /* float not supported */
3167         if (!*buf)
3168           return n_matched;
3169         if (scan_double(&buf, d, width)<0)
3170           return n_matched;
3171         ++pattern;
3172         ++n_matched;
3173       } else if (*pattern == 'd') {
3174         long lng=0;
3175         if (scan_signed(&buf, &lng, width)<0)
3176           return n_matched;
3177         if (longmod) {
3178           long *out = va_arg(ap, long *);
3179           *out = lng;
3180         } else {
3181           int *out = va_arg(ap, int *);
3182           if (lng < INT_MIN || lng > INT_MAX)
3183             return n_matched;
3184           *out = (int)lng;
3185         }
3186         ++pattern;
3187         ++n_matched;
3188       } else if (*pattern == 's') {
3189         char *s = va_arg(ap, char *);
3190         if (longmod)
3191           return -1;
3192         if (width < 0)
3193           return -1;
3194         if (scan_string(&buf, s, width)<0)
3195           return n_matched;
3196         ++pattern;
3197         ++n_matched;
3198       } else if (*pattern == 'c') {
3199         char *ch = va_arg(ap, char *);
3200         if (longmod)
3201           return -1;
3202         if (width != -1)
3203           return -1;
3204         if (!*buf)
3205           return n_matched;
3206         *ch = *buf++;
3207         ++pattern;
3208         ++n_matched;
3209       } else if (*pattern == '%') {
3210         if (*buf != '%')
3211           return n_matched;
3212         if (longmod)
3213           return -1;
3214         ++buf;
3215         ++pattern;
3216       } else {
3217         return -1; /* Unrecognized pattern component. */
3218       }
3219     }
3220   }
3221
3222   return n_matched;
3223 }
3224
3225 /** Minimal sscanf replacement: parse <b>buf</b> according to <b>pattern</b>
3226  * and store the results in the corresponding argument fields.  Differs from
3227  * sscanf in that:
3228  * <ul><li>It only handles %u, %lu, %x, %lx, %[NUM]s, %d, %ld, %lf, and %c.
3229  *     <li>It only handles decimal inputs for %lf. (12.3, not 1.23e1)
3230  *     <li>It does not handle arbitrarily long widths.
3231  *     <li>Numbers do not consume any space characters.
3232  *     <li>It is locale-independent.
3233  *     <li>%u and %x do not consume any space.
3234  *     <li>It returns -1 on malformed patterns.</ul>
3235  *
3236  * (As with other locale-independent functions, we need this to parse data that
3237  * is in ASCII without worrying that the C library's locale-handling will make
3238  * miscellaneous characters look like numbers, spaces, and so on.)
3239  */
3240 int
3241 tor_sscanf(const char *buf, const char *pattern, ...)
3242 {
3243   int r;
3244   va_list ap;
3245   va_start(ap, pattern);
3246   r = tor_vsscanf(buf, pattern, ap);
3247   va_end(ap);
3248   return r;
3249 }
3250
3251 /** Append the string produced by tor_asprintf(<b>pattern</b>, <b>...</b>)
3252  * to <b>sl</b>. */
3253 void
3254 smartlist_add_asprintf(struct smartlist_t *sl, const char *pattern, ...)
3255 {
3256   va_list ap;
3257   va_start(ap, pattern);
3258   smartlist_add_vasprintf(sl, pattern, ap);
3259   va_end(ap);
3260 }
3261
3262 /** va_list-based backend of smartlist_add_asprintf. */
3263 void
3264 smartlist_add_vasprintf(struct smartlist_t *sl, const char *pattern,
3265                         va_list args)
3266 {
3267   char *str = NULL;
3268
3269   tor_vasprintf(&str, pattern, args);
3270   tor_assert(str != NULL);
3271
3272   smartlist_add(sl, str);
3273 }
3274
3275 /** Return a new list containing the filenames in the directory <b>dirname</b>.
3276  * Return NULL on error or if <b>dirname</b> is not a directory.
3277  */
3278 smartlist_t *
3279 tor_listdir(const char *dirname)
3280 {
3281   smartlist_t *result;
3282 #ifdef _WIN32
3283   char *pattern=NULL;
3284   TCHAR tpattern[MAX_PATH] = {0};
3285   char name[MAX_PATH*2+1] = {0};
3286   HANDLE handle;
3287   WIN32_FIND_DATA findData;
3288   tor_asprintf(&pattern, "%s\\*", dirname);
3289 #ifdef UNICODE
3290   mbstowcs(tpattern,pattern,MAX_PATH);
3291 #else
3292   strlcpy(tpattern, pattern, MAX_PATH);
3293 #endif
3294   if (INVALID_HANDLE_VALUE == (handle = FindFirstFile(tpattern, &findData))) {
3295     tor_free(pattern);
3296     return NULL;
3297   }
3298   result = smartlist_new();
3299   while (1) {
3300 #ifdef UNICODE
3301     wcstombs(name,findData.cFileName,MAX_PATH);
3302     name[sizeof(name)-1] = '\0';
3303 #else
3304     strlcpy(name,findData.cFileName,sizeof(name));
3305 #endif
3306     if (strcmp(name, ".") &&
3307         strcmp(name, "..")) {
3308       smartlist_add(result, tor_strdup(name));
3309     }
3310     if (!FindNextFile(handle, &findData)) {
3311       DWORD err;
3312       if ((err = GetLastError()) != ERROR_NO_MORE_FILES) {
3313         char *errstr = format_win32_error(err);
3314         log_warn(LD_FS, "Error reading directory '%s': %s", dirname, errstr);
3315         tor_free(errstr);
3316       }
3317       break;
3318     }
3319   }
3320   FindClose(handle);
3321   tor_free(pattern);
3322 #else
3323   const char *prot_dname = sandbox_intern_string(dirname);
3324   DIR *d;
3325   struct dirent *de;
3326   if (!(d = opendir(prot_dname)))
3327     return NULL;
3328
3329   result = smartlist_new();
3330   while ((de = readdir(d))) {
3331     if (!strcmp(de->d_name, ".") ||
3332         !strcmp(de->d_name, ".."))
3333       continue;
3334     smartlist_add(result, tor_strdup(de->d_name));
3335   }
3336   closedir(d);
3337 #endif
3338   return result;
3339 }
3340
3341 /** Return true iff <b>filename</b> is a relative path. */
3342 int
3343 path_is_relative(const char *filename)
3344 {
3345   if (filename && filename[0] == '/')
3346     return 0;
3347 #ifdef _WIN32
3348   else if (filename && filename[0] == '\\')
3349     return 0;
3350   else if (filename && strlen(filename)>3 && TOR_ISALPHA(filename[0]) &&
3351            filename[1] == ':' && filename[2] == '\\')
3352     return 0;
3353 #endif
3354   else
3355     return 1;
3356 }
3357
3358 /* =====
3359  * Process helpers
3360  * ===== */
3361
3362 #ifndef _WIN32
3363 /* Based on code contributed by christian grothoff */
3364 /** True iff we've called start_daemon(). */
3365 static int start_daemon_called = 0;
3366 /** True iff we've called finish_daemon(). */
3367 static int finish_daemon_called = 0;
3368 /** Socketpair used to communicate between parent and child process while
3369  * daemonizing. */
3370 static int daemon_filedes[2];
3371 /** Start putting the process into daemon mode: fork and drop all resources
3372  * except standard fds.  The parent process never returns, but stays around
3373  * until finish_daemon is called.  (Note: it's safe to call this more
3374  * than once: calls after the first are ignored.)
3375  */
3376 void
3377 start_daemon(void)
3378 {
3379   pid_t pid;
3380
3381   if (start_daemon_called)
3382     return;
3383   start_daemon_called = 1;
3384
3385   if (pipe(daemon_filedes)) {
3386     log_err(LD_GENERAL,"pipe failed; exiting. Error was %s", strerror(errno));
3387     exit(1);
3388   }
3389   pid = fork();
3390   if (pid < 0) {
3391     log_err(LD_GENERAL,"fork failed. Exiting.");
3392     exit(1);
3393   }
3394   if (pid) {  /* Parent */
3395     int ok;
3396     char c;
3397
3398     close(daemon_filedes[1]); /* we only read */
3399     ok = -1;
3400     while (0 < read(daemon_filedes[0], &c, sizeof(char))) {
3401       if (c == '.')
3402         ok = 1;
3403     }
3404     fflush(stdout);
3405     if (ok == 1)
3406       exit(0);
3407     else
3408       exit(1); /* child reported error */
3409   } else { /* Child */
3410     close(daemon_filedes[0]); /* we only write */
3411
3412     pid = setsid(); /* Detach from controlling terminal */
3413     /*
3414      * Fork one more time, so the parent (the session group leader) can exit.
3415      * This means that we, as a non-session group leader, can never regain a
3416      * controlling terminal.   This part is recommended by Stevens's
3417      * _Advanced Programming in the Unix Environment_.
3418      */
3419     if (fork() != 0) {
3420       exit(0);
3421     }
3422     set_main_thread(); /* We are now the main thread. */
3423
3424     return;
3425   }
3426 }
3427
3428 /** Finish putting the process into daemon mode: drop standard fds, and tell
3429  * the parent process to exit.  (Note: it's safe to call this more than once:
3430  * calls after the first are ignored.  Calls start_daemon first if it hasn't
3431  * been called already.)
3432  */
3433 void
3434 finish_daemon(const char *desired_cwd)
3435 {
3436   int nullfd;
3437   char c = '.';
3438   if (finish_daemon_called)
3439     return;
3440   if (!start_daemon_called)
3441     start_daemon();
3442   finish_daemon_called = 1;
3443
3444   if (!desired_cwd)
3445     desired_cwd = "/";
3446    /* Don't hold the wrong FS mounted */
3447   if (chdir(desired_cwd) < 0) {
3448     log_err(LD_GENERAL,"chdir to \"%s\" failed. Exiting.",desired_cwd);
3449     exit(1);
3450   }
3451
3452   nullfd = tor_open_cloexec("/dev/null", O_RDWR, 0);
3453   if (nullfd < 0) {
3454     log_err(LD_GENERAL,"/dev/null can't be opened. Exiting.");
3455     exit(1);
3456   }
3457   /* close fds linking to invoking terminal, but
3458    * close usual incoming fds, but redirect them somewhere
3459    * useful so the fds don't get reallocated elsewhere.
3460    */
3461   if (dup2(nullfd,0) < 0 ||
3462       dup2(nullfd,1) < 0 ||
3463       dup2(nullfd,2) < 0) {
3464     log_err(LD_GENERAL,"dup2 failed. Exiting.");
3465     exit(1);
3466   }
3467   if (nullfd > 2)
3468     close(nullfd);
3469   /* signal success */
3470   if (write(daemon_filedes[1], &c, sizeof(char)) != sizeof(char)) {
3471     log_err(LD_GENERAL,"write failed. Exiting.");
3472   }
3473   close(daemon_filedes[1]);
3474 }
3475 #else
3476 /* defined(_WIN32) */
3477 void
3478 start_daemon(void)
3479 {
3480 }
3481 void
3482 finish_daemon(const char *cp)
3483 {
3484   (void)cp;
3485 }
3486 #endif
3487
3488 /** Write the current process ID, followed by NL, into <b>filename</b>.
3489  */
3490 void
3491 write_pidfile(const char *filename)
3492 {
3493   FILE *pidfile;
3494
3495   if ((pidfile = fopen(filename, "w")) == NULL) {
3496     log_warn(LD_FS, "Unable to open \"%s\" for writing: %s", filename,
3497              strerror(errno));
3498   } else {
3499 #ifdef _WIN32
3500     fprintf(pidfile, "%d\n", (int)_getpid());
3501 #else
3502     fprintf(pidfile, "%d\n", (int)getpid());
3503 #endif
3504     fclose(pidfile);
3505   }
3506 }
3507
3508 #ifdef _WIN32
3509 HANDLE
3510 load_windows_system_library(const TCHAR *library_name)
3511 {
3512   TCHAR path[MAX_PATH];
3513   unsigned n;
3514   n = GetSystemDirectory(path, MAX_PATH);
3515   if (n == 0 || n + _tcslen(library_name) + 2 >= MAX_PATH)
3516     return 0;
3517   _tcscat(path, TEXT("\\"));
3518   _tcscat(path, library_name);
3519   return LoadLibrary(path);
3520 }
3521 #endif
3522
3523 /** Format a single argument for being put on a Windows command line.
3524  * Returns a newly allocated string */
3525 static char *
3526 format_win_cmdline_argument(const char *arg)
3527 {
3528   char *formatted_arg;
3529   char need_quotes;
3530   const char *c;
3531   int i;
3532   int bs_counter = 0;
3533   /* Backslash we can point to when one is inserted into the string */
3534   const char backslash = '\\';
3535
3536   /* Smartlist of *char */
3537   smartlist_t *arg_chars;
3538   arg_chars = smartlist_new();
3539
3540   /* Quote string if it contains whitespace or is empty */
3541   need_quotes = (strchr(arg, ' ') || strchr(arg, '\t') || '\0' == arg[0]);
3542
3543   /* Build up smartlist of *chars */
3544   for (c=arg; *c != '\0'; c++) {
3545     if ('"' == *c) {
3546       /* Double up backslashes preceding a quote */
3547       for (i=0; i<(bs_counter*2); i++)
3548         smartlist_add(arg_chars, (void*)&backslash);
3549       bs_counter = 0;
3550       /* Escape the quote */
3551       smartlist_add(arg_chars, (void*)&backslash);
3552       smartlist_add(arg_chars, (void*)c);
3553     } else if ('\\' == *c) {
3554       /* Count backslashes until we know whether to double up */
3555       bs_counter++;
3556     } else {
3557       /* Don't double up slashes preceding a non-quote */
3558       for (i=0; i<bs_counter; i++)
3559         smartlist_add(arg_chars, (void*)&backslash);
3560       bs_counter = 0;
3561       smartlist_add(arg_chars, (void*)c);
3562     }
3563   }
3564   /* Don't double up trailing backslashes */
3565   for (i=0; i<bs_counter; i++)
3566     smartlist_add(arg_chars, (void*)&backslash);
3567
3568   /* Allocate space for argument, quotes (if needed), and terminator */
3569   const size_t formatted_arg_len = smartlist_len(arg_chars) +
3570     (need_quotes ? 2 : 0) + 1;
3571   formatted_arg = tor_malloc_zero(formatted_arg_len);
3572
3573   /* Add leading quote */
3574   i=0;
3575   if (need_quotes)
3576     formatted_arg[i++] = '"';
3577
3578   /* Add characters */
3579   SMARTLIST_FOREACH(arg_chars, char*, c,
3580   {
3581     formatted_arg[i++] = *c;
3582   });
3583
3584   /* Add trailing quote */
3585   if (need_quotes)
3586     formatted_arg[i++] = '"';
3587   formatted_arg[i] = '\0';
3588
3589   smartlist_free(arg_chars);
3590   return formatted_arg;
3591 }
3592
3593 /** Format a command line for use on Windows, which takes the command as a
3594  * string rather than string array. Follows the rules from "Parsing C++
3595  * Command-Line Arguments" in MSDN. Algorithm based on list2cmdline in the
3596  * Python subprocess module. Returns a newly allocated string */
3597 char *
3598 tor_join_win_cmdline(const char *argv[])
3599 {
3600   smartlist_t *argv_list;
3601   char *joined_argv;
3602   int i;
3603
3604   /* Format each argument and put the result in a smartlist */
3605   argv_list = smartlist_new();
3606   for (i=0; argv[i] != NULL; i++) {
3607     smartlist_add(argv_list, (void *)format_win_cmdline_argument(argv[i]));
3608   }
3609
3610   /* Join the arguments with whitespace */
3611   joined_argv = smartlist_join_strings(argv_list, " ", 0, NULL);
3612
3613   /* Free the newly allocated arguments, and the smartlist */
3614   SMARTLIST_FOREACH(argv_list, char *, arg,
3615   {
3616     tor_free(arg);
3617   });
3618   smartlist_free(argv_list);
3619
3620   return joined_argv;
3621 }
3622
3623 /* As format_{hex,dex}_number_sigsafe, but takes a <b>radix</b> argument
3624  * in range 2..16 inclusive. */
3625 static int
3626 format_number_sigsafe(unsigned long x, char *buf, int buf_len,
3627                       unsigned int radix)
3628 {
3629   unsigned long tmp;
3630   int len;
3631   char *cp;
3632
3633   /* NOT tor_assert. This needs to be safe to run from within a signal handler,
3634    * and from within the 'tor_assert() has failed' code. */
3635   if (radix < 2 || radix > 16)
3636     return 0;
3637
3638   /* Count how many digits we need. */
3639   tmp = x;
3640   len = 1;
3641   while (tmp >= radix) {
3642     tmp /= radix;
3643     ++len;
3644   }
3645
3646   /* Not long enough */
3647   if (!buf || len >= buf_len)
3648     return 0;
3649
3650   cp = buf + len;
3651   *cp = '\0';
3652   do {
3653     unsigned digit = (unsigned) (x % radix);
3654     tor_assert(cp > buf);
3655     --cp;
3656     *cp = "0123456789ABCDEF"[digit];
3657     x /= radix;
3658   } while (x);
3659
3660   /* NOT tor_assert; see above. */
3661   if (cp != buf) {
3662     abort();
3663   }
3664
3665   return len;
3666 }
3667
3668 /**
3669  * Helper function to output hex numbers from within a signal handler.
3670  *
3671  * Writes the nul-terminated hexadecimal digits of <b>x</b> into a buffer
3672  * <b>buf</b> of size <b>buf_len</b>, and return the actual number of digits
3673  * written, not counting the terminal NUL.
3674  *
3675  * If there is insufficient space, write nothing and return 0.
3676  *
3677  * This accepts an unsigned int because format_helper_exit_status() needs to
3678  * call it with a signed int and an unsigned char, and since the C standard
3679  * does not guarantee that an int is wider than a char (an int must be at
3680  * least 16 bits but it is permitted for a char to be that wide as well), we
3681  * can't assume a signed int is sufficient to accomodate an unsigned char.
3682  * Thus, format_helper_exit_status() will still need to emit any require '-'
3683  * on its own.
3684  *
3685  * For most purposes, you'd want to use tor_snprintf("%x") instead of this
3686  * function; it's designed to be used in code paths where you can't call
3687  * arbitrary C functions.
3688  */
3689 int
3690 format_hex_number_sigsafe(unsigned long x, char *buf, int buf_len)
3691 {
3692   return format_number_sigsafe(x, buf, buf_len, 16);
3693 }
3694
3695 /** As format_hex_number_sigsafe, but format the number in base 10. */
3696 int
3697 format_dec_number_sigsafe(unsigned long x, char *buf, int buf_len)
3698 {
3699   return format_number_sigsafe(x, buf, buf_len, 10);
3700 }
3701
3702 #ifndef _WIN32
3703 /** Format <b>child_state</b> and <b>saved_errno</b> as a hex string placed in
3704  * <b>hex_errno</b>.  Called between fork and _exit, so must be signal-handler
3705  * safe.
3706  *
3707  * <b>hex_errno</b> must have at least HEX_ERRNO_SIZE+1 bytes available.
3708  *
3709  * The format of <b>hex_errno</b> is: "CHILD_STATE/ERRNO\n", left-padded
3710  * with spaces. CHILD_STATE indicates where
3711  * in the processs of starting the child process did the failure occur (see
3712  * CHILD_STATE_* macros for definition), and SAVED_ERRNO is the value of
3713  * errno when the failure occurred.
3714  *
3715  * On success return the number of characters added to hex_errno, not counting
3716  * the terminating NUL; return -1 on error.
3717  */
3718 STATIC int
3719 format_helper_exit_status(unsigned char child_state, int saved_errno,
3720                           char *hex_errno)
3721 {
3722   unsigned int unsigned_errno;
3723   int written, left;
3724   char *cur;
3725   size_t i;
3726   int res = -1;
3727
3728   /* Fill hex_errno with spaces, and a trailing newline (memset may
3729      not be signal handler safe, so we can't use it) */
3730   for (i = 0; i < (HEX_ERRNO_SIZE - 1); i++)
3731     hex_errno[i] = ' ';
3732   hex_errno[HEX_ERRNO_SIZE - 1] = '\n';
3733
3734   /* Convert errno to be unsigned for hex conversion */
3735   if (saved_errno < 0) {
3736     // Avoid overflow on the cast to unsigned int when result is INT_MIN
3737     // by adding 1 to the signed int negative value,
3738     // then, after it has been negated and cast to unsigned,
3739     // adding the original 1 back (the double-addition is intentional).
3740     // Otherwise, the cast to signed could cause a temporary int
3741     // to equal INT_MAX + 1, which is undefined.
3742     unsigned_errno = ((unsigned int) -(saved_errno + 1)) + 1;
3743   } else {
3744     unsigned_errno = (unsigned int) saved_errno;
3745   }
3746
3747   /*
3748    * Count how many chars of space we have left, and keep a pointer into the
3749    * current point in the buffer.
3750    */
3751   left = HEX_ERRNO_SIZE+1;
3752   cur = hex_errno;
3753
3754   /* Emit child_state */
3755   written = format_hex_number_sigsafe(child_state, cur, left);
3756
3757   if (written <= 0)
3758     goto err;
3759
3760   /* Adjust left and cur */
3761   left -= written;
3762   cur += written;
3763   if (left <= 0)
3764     goto err;
3765
3766   /* Now the '/' */
3767   *cur = '/';
3768
3769   /* Adjust left and cur */
3770   ++cur;
3771   --left;
3772   if (left <= 0)
3773     goto err;
3774
3775   /* Need minus? */
3776   if (saved_errno < 0) {
3777     *cur = '-';
3778     ++cur;
3779     --left;
3780     if (left <= 0)
3781       goto err;
3782   }
3783
3784   /* Emit unsigned_errno */
3785   written = format_hex_number_sigsafe(unsigned_errno, cur, left);
3786
3787   if (written <= 0)
3788     goto err;
3789
3790   /* Adjust left and cur */
3791   left -= written;
3792   cur += written;
3793
3794   /* Check that we have enough space left for a newline and a NUL */
3795   if (left <= 1)
3796     goto err;
3797
3798   /* Emit the newline and NUL */
3799   *cur++ = '\n';
3800   *cur++ = '\0';
3801
3802   res = (int)(cur - hex_errno - 1);
3803
3804   goto done;
3805
3806  err:
3807   /*
3808    * In error exit, just write a '\0' in the first char so whatever called
3809    * this at least won't fall off the end.
3810    */
3811   *hex_errno = '\0';
3812
3813  done:
3814   return res;
3815 }
3816 #endif
3817
3818 /* Maximum number of file descriptors, if we cannot get it via sysconf() */
3819 #define DEFAULT_MAX_FD 256
3820
3821 /** Terminate the process of <b>process_handle</b>.
3822  *  Code borrowed from Python's os.kill. */
3823 int
3824 tor_terminate_process(process_handle_t *process_handle)
3825 {
3826 #ifdef _WIN32
3827   if (tor_get_exit_code(process_handle, 0, NULL) == PROCESS_EXIT_RUNNING) {
3828     HANDLE handle = process_handle->pid.hProcess;
3829
3830     if (!TerminateProcess(handle, 0))
3831       return -1;
3832     else
3833       return 0;
3834   }
3835 #else /* Unix */
3836   if (process_handle->waitpid_cb) {
3837     /* We haven't got a waitpid yet, so we can just kill off the process. */
3838     return kill(process_handle->pid, SIGTERM);
3839   }
3840 #endif
3841
3842   return -1;
3843 }
3844
3845 /** Return the Process ID of <b>process_handle</b>. */
3846 int
3847 tor_process_get_pid(process_handle_t *process_handle)
3848 {
3849 #ifdef _WIN32
3850   return (int) process_handle->pid.dwProcessId;
3851 #else
3852   return (int) process_handle->pid;
3853 #endif
3854 }
3855
3856 #ifdef _WIN32
3857 HANDLE
3858 tor_process_get_stdout_pipe(process_handle_t *process_handle)
3859 {
3860   return process_handle->stdout_pipe;
3861 }
3862 #else
3863 /* DOCDOC tor_process_get_stdout_pipe */
3864 FILE *
3865 tor_process_get_stdout_pipe(process_handle_t *process_handle)
3866 {
3867   return process_handle->stdout_handle;
3868 }
3869 #endif
3870
3871 /* DOCDOC process_handle_new */
3872 static process_handle_t *
3873 process_handle_new(void)
3874 {
3875   process_handle_t *out = tor_malloc_zero(sizeof(process_handle_t));
3876
3877 #ifdef _WIN32
3878   out->stdin_pipe = INVALID_HANDLE_VALUE;
3879   out->stdout_pipe = INVALID_HANDLE_VALUE;
3880   out->stderr_pipe = INVALID_HANDLE_VALUE;
3881 #else
3882   out->stdin_pipe = -1;
3883   out->stdout_pipe = -1;
3884   out->stderr_pipe = -1;
3885 #endif
3886
3887   return out;
3888 }
3889
3890 #ifndef _WIN32
3891 /** Invoked when a process that we've launched via tor_spawn_background() has
3892  * been found to have terminated.
3893  */
3894 static void
3895 process_handle_waitpid_cb(int status, void *arg)
3896 {
3897   process_handle_t *process_handle = arg;
3898
3899   process_handle->waitpid_exit_status = status;
3900   clear_waitpid_callback(process_handle->waitpid_cb);
3901   if (process_handle->status == PROCESS_STATUS_RUNNING)
3902     process_handle->status = PROCESS_STATUS_NOTRUNNING;
3903   process_handle->waitpid_cb = 0;
3904 }
3905 #endif
3906
3907 /**
3908  * @name child-process states
3909  *
3910  * Each of these values represents a possible state that a child process can
3911  * be in.  They're used to determine what to say when telling the parent how
3912  * far along we were before failure.
3913  *
3914  * @{
3915  */
3916 #define CHILD_STATE_INIT 0
3917 #define CHILD_STATE_PIPE 1
3918 #define CHILD_STATE_MAXFD 2
3919 #define CHILD_STATE_FORK 3
3920 #define CHILD_STATE_DUPOUT 4
3921 #define CHILD_STATE_DUPERR 5
3922 #define CHILD_STATE_DUPIN 6
3923 #define CHILD_STATE_CLOSEFD 7
3924 #define CHILD_STATE_EXEC 8
3925 #define CHILD_STATE_FAILEXEC 9
3926 /** @} */
3927 /** Start a program in the background. If <b>filename</b> contains a '/', then
3928  * it will be treated as an absolute or relative path.  Otherwise, on
3929  * non-Windows systems, the system path will be searched for <b>filename</b>.
3930  * On Windows, only the current directory will be searched. Here, to search the
3931  * system path (as well as the application directory, current working
3932  * directory, and system directories), set filename to NULL.
3933  *
3934  * The strings in <b>argv</b> will be passed as the command line arguments of
3935  * the child program (following convention, argv[0] should normally be the
3936  * filename of the executable, and this must be the case if <b>filename</b> is
3937  * NULL). The last element of argv must be NULL. A handle to the child process
3938  * will be returned in process_handle (which must be non-NULL). Read
3939  * process_handle.status to find out if the process was successfully launched.
3940  * For convenience, process_handle.status is returned by this function.
3941  *
3942  * Some parts of this code are based on the POSIX subprocess module from
3943  * Python, and example code from
3944  * http://msdn.microsoft.com/en-us/library/ms682499%28v=vs.85%29.aspx.
3945  */
3946 int
3947 tor_spawn_background(const char *const filename, const char **argv,
3948                      process_environment_t *env,
3949                      process_handle_t **process_handle_out)
3950 {
3951 #ifdef _WIN32
3952   HANDLE stdout_pipe_read = NULL;
3953   HANDLE stdout_pipe_write = NULL;
3954   HANDLE stderr_pipe_read = NULL;
3955   HANDLE stderr_pipe_write = NULL;
3956   HANDLE stdin_pipe_read = NULL;
3957   HANDLE stdin_pipe_write = NULL;
3958   process_handle_t *process_handle;
3959   int status;
3960
3961   STARTUPINFOA siStartInfo;
3962   BOOL retval = FALSE;
3963
3964   SECURITY_ATTRIBUTES saAttr;
3965   char *joined_argv;
3966
3967   saAttr.nLength = sizeof(SECURITY_ATTRIBUTES);
3968   saAttr.bInheritHandle = TRUE;
3969   /* TODO: should we set explicit security attributes? (#2046, comment 5) */
3970   saAttr.lpSecurityDescriptor = NULL;
3971
3972   /* Assume failure to start process */
3973   status = PROCESS_STATUS_ERROR;
3974
3975   /* Set up pipe for stdout */
3976   if (!CreatePipe(&stdout_pipe_read, &stdout_pipe_write, &saAttr, 0)) {
3977     log_warn(LD_GENERAL,
3978       "Failed to create pipe for stdout communication with child process: %s",
3979       format_win32_error(GetLastError()));
3980     return status;
3981   }
3982   if (!SetHandleInformation(stdout_pipe_read, HANDLE_FLAG_INHERIT, 0)) {
3983     log_warn(LD_GENERAL,
3984       "Failed to configure pipe for stdout communication with child "
3985       "process: %s", format_win32_error(GetLastError()));
3986     return status;
3987   }
3988
3989   /* Set up pipe for stderr */
3990   if (!CreatePipe(&stderr_pipe_read, &stderr_pipe_write, &saAttr, 0)) {
3991     log_warn(LD_GENERAL,
3992       "Failed to create pipe for stderr communication with child process: %s",
3993       format_win32_error(GetLastError()));
3994     return status;
3995   }
3996   if (!SetHandleInformation(stderr_pipe_read, HANDLE_FLAG_INHERIT, 0)) {
3997     log_warn(LD_GENERAL,
3998       "Failed to configure pipe for stderr communication with child "
3999       "process: %s", format_win32_error(GetLastError()));
4000     return status;
4001   }
4002
4003   /* Set up pipe for stdin */
4004   if (!CreatePipe(&stdin_pipe_read, &stdin_pipe_write, &saAttr, 0)) {
4005     log_warn(LD_GENERAL,
4006       "Failed to create pipe for stdin communication with child process: %s",
4007       format_win32_error(GetLastError()));
4008     return status;
4009   }
4010   if (!SetHandleInformation(stdin_pipe_write, HANDLE_FLAG_INHERIT, 0)) {
4011     log_warn(LD_GENERAL,
4012       "Failed to configure pipe for stdin communication with child "
4013       "process: %s", format_win32_error(GetLastError()));
4014     return status;
4015   }
4016
4017   /* Create the child process */
4018
4019   /* Windows expects argv to be a whitespace delimited string, so join argv up
4020    */
4021   joined_argv = tor_join_win_cmdline(argv);
4022
4023   process_handle = process_handle_new();
4024   process_handle->status = status;
4025
4026   ZeroMemory(&(process_handle->pid), sizeof(PROCESS_INFORMATION));
4027   ZeroMemory(&siStartInfo, sizeof(STARTUPINFO));
4028   siStartInfo.cb = sizeof(STARTUPINFO);
4029   siStartInfo.hStdError = stderr_pipe_write;
4030   siStartInfo.hStdOutput = stdout_pipe_write;
4031   siStartInfo.hStdInput = stdin_pipe_read;
4032   siStartInfo.dwFlags |= STARTF_USESTDHANDLES;
4033
4034   /* Create the child process */
4035
4036   retval = CreateProcessA(filename,      // module name
4037                  joined_argv,   // command line
4038   /* TODO: should we set explicit security attributes? (#2046, comment 5) */
4039                  NULL,          // process security attributes
4040                  NULL,          // primary thread security attributes
4041                  TRUE,          // handles are inherited
4042   /*(TODO: set CREATE_NEW CONSOLE/PROCESS_GROUP to make GetExitCodeProcess()
4043    * work?) */
4044                  CREATE_NO_WINDOW,             // creation flags
4045                  (env==NULL) ? NULL : env->windows_environment_block,
4046                  NULL,          // use parent's current directory
4047                  &siStartInfo,  // STARTUPINFO pointer
4048                  &(process_handle->pid));  // receives PROCESS_INFORMATION
4049
4050   tor_free(joined_argv);
4051
4052   if (!retval) {
4053     log_warn(LD_GENERAL,
4054       "Failed to create child process %s: %s", filename?filename:argv[0],
4055       format_win32_error(GetLastError()));
4056     tor_free(process_handle);
4057   } else  {
4058     /* TODO: Close hProcess and hThread in process_handle->pid? */
4059     process_handle->stdout_pipe = stdout_pipe_read;
4060     process_handle->stderr_pipe = stderr_pipe_read;
4061     process_handle->stdin_pipe = stdin_pipe_write;
4062     status = process_handle->status = PROCESS_STATUS_RUNNING;
4063   }
4064
4065   /* TODO: Close pipes on exit */
4066   *process_handle_out = process_handle;
4067   return status;
4068 #else // _WIN32
4069   pid_t pid;
4070   int stdout_pipe[2];
4071   int stderr_pipe[2];
4072   int stdin_pipe[2];
4073   int fd, retval;
4074   ssize_t nbytes;
4075   process_handle_t *process_handle;
4076   int status;
4077
4078   const char *error_message = SPAWN_ERROR_MESSAGE;
4079   size_t error_message_length;
4080
4081   /* Represents where in the process of spawning the program is;
4082      this is used for printing out the error message */
4083   unsigned char child_state = CHILD_STATE_INIT;
4084
4085   char hex_errno[HEX_ERRNO_SIZE + 2]; /* + 1 should be sufficient actually */
4086
4087   static int max_fd = -1;
4088
4089   status = PROCESS_STATUS_ERROR;
4090
4091   /* We do the strlen here because strlen() is not signal handler safe,
4092      and we are not allowed to use unsafe functions between fork and exec */
4093   error_message_length = strlen(error_message);
4094
4095   child_state = CHILD_STATE_PIPE;
4096
4097   /* Set up pipe for redirecting stdout, stderr, and stdin of child */
4098   retval = pipe(stdout_pipe);
4099   if (-1 == retval) {
4100     log_warn(LD_GENERAL,
4101       "Failed to set up pipe for stdout communication with child process: %s",
4102        strerror(errno));
4103     return status;
4104   }
4105
4106   retval = pipe(stderr_pipe);
4107   if (-1 == retval) {
4108     log_warn(LD_GENERAL,
4109       "Failed to set up pipe for stderr communication with child process: %s",
4110       strerror(errno));
4111
4112     close(stdout_pipe[0]);
4113     close(stdout_pipe[1]);
4114
4115     return status;
4116   }
4117
4118   retval = pipe(stdin_pipe);
4119   if (-1 == retval) {
4120     log_warn(LD_GENERAL,
4121       "Failed to set up pipe for stdin communication with child process: %s",
4122        strerror(errno));
4123
4124     close(stdout_pipe[0]);
4125     close(stdout_pipe[1]);
4126     close(stderr_pipe[0]);
4127     close(stderr_pipe[1]);
4128
4129     return status;
4130   }
4131
4132   child_state = CHILD_STATE_MAXFD;
4133
4134 #ifdef _SC_OPEN_MAX
4135   if (-1 == max_fd) {
4136     max_fd = (int) sysconf(_SC_OPEN_MAX);
4137     if (max_fd == -1) {
4138       max_fd = DEFAULT_MAX_FD;
4139       log_warn(LD_GENERAL,
4140                "Cannot find maximum file descriptor, assuming %d", max_fd);
4141     }
4142   }
4143 #else
4144   max_fd = DEFAULT_MAX_FD;
4145 #endif
4146
4147   child_state = CHILD_STATE_FORK;
4148
4149   pid = fork();
4150   if (0 == pid) {
4151     /* In child */
4152
4153 #if defined(HAVE_SYS_PRCTL_H) && defined(__linux__)
4154     /* Attempt to have the kernel issue a SIGTERM if the parent
4155      * goes away. Certain attributes of the binary being execve()ed
4156      * will clear this during the execve() call, but it's better
4157      * than nothing.
4158      */
4159     prctl(PR_SET_PDEATHSIG, SIGTERM);
4160 #endif
4161
4162     child_state = CHILD_STATE_DUPOUT;
4163
4164     /* Link child stdout to the write end of the pipe */
4165     retval = dup2(stdout_pipe[1], STDOUT_FILENO);
4166     if (-1 == retval)
4167         goto error;
4168
4169     child_state = CHILD_STATE_DUPERR;
4170
4171     /* Link child stderr to the write end of the pipe */
4172     retval = dup2(stderr_pipe[1], STDERR_FILENO);
4173     if (-1 == retval)
4174         goto error;
4175
4176     child_state = CHILD_STATE_DUPIN;
4177
4178     /* Link child stdin to the read end of the pipe */
4179     retval = dup2(stdin_pipe[0], STDIN_FILENO);
4180     if (-1 == retval)
4181       goto error;
4182
4183     child_state = CHILD_STATE_CLOSEFD;
4184
4185     close(stderr_pipe[0]);
4186     close(stderr_pipe[1]);
4187     close(stdout_pipe[0]);
4188     close(stdout_pipe[1]);
4189     close(stdin_pipe[0]);
4190     close(stdin_pipe[1]);
4191
4192     /* Close all other fds, including the read end of the pipe */
4193     /* XXX: We should now be doing enough FD_CLOEXEC setting to make
4194      * this needless. */
4195     for (fd = STDERR_FILENO + 1; fd < max_fd; fd++) {
4196       close(fd);
4197     }
4198
4199     child_state = CHILD_STATE_EXEC;
4200
4201     /* Call the requested program. We need the cast because
4202        execvp doesn't define argv as const, even though it
4203        does not modify the arguments */
4204     if (env)
4205       execve(filename, (char *const *) argv, env->unixoid_environment_block);
4206     else {
4207       static char *new_env[] = { NULL };
4208       execve(filename, (char *const *) argv, new_env);
4209     }
4210
4211     /* If we got here, the exec or open(/dev/null) failed */
4212
4213     child_state = CHILD_STATE_FAILEXEC;
4214
4215   error:
4216     {
4217       /* XXX: are we leaking fds from the pipe? */
4218       int n;
4219
4220       n = format_helper_exit_status(child_state, errno, hex_errno);
4221
4222       if (n >= 0) {
4223         /* Write the error message. GCC requires that we check the return
4224            value, but there is nothing we can do if it fails */
4225         /* TODO: Don't use STDOUT, use a pipe set up just for this purpose */
4226         nbytes = write(STDOUT_FILENO, error_message, error_message_length);
4227         nbytes = write(STDOUT_FILENO, hex_errno, n);
4228       }
4229     }
4230
4231     (void) nbytes;
4232
4233     _exit(255);
4234     /* Never reached, but avoids compiler warning */
4235     return status;
4236   }
4237
4238   /* In parent */
4239
4240   if (-1 == pid) {
4241     log_warn(LD_GENERAL, "Failed to fork child process: %s", strerror(errno));
4242     close(stdin_pipe[0]);
4243     close(stdin_pipe[1]);
4244     close(stdout_pipe[0]);
4245     close(stdout_pipe[1]);
4246     close(stderr_pipe[0]);
4247     close(stderr_pipe[1]);
4248     return status;
4249   }
4250
4251   process_handle = process_handle_new();
4252   process_handle->status = status;
4253   process_handle->pid = pid;
4254
4255   /* TODO: If the child process forked but failed to exec, waitpid it */
4256
4257   /* Return read end of the pipes to caller, and close write end */
4258   process_handle->stdout_pipe = stdout_pipe[0];
4259   retval = close(stdout_pipe[1]);
4260
4261   if (-1 == retval) {
4262     log_warn(LD_GENERAL,
4263             "Failed to close write end of stdout pipe in parent process: %s",
4264             strerror(errno));
4265   }
4266
4267   process_handle->waitpid_cb = set_waitpid_callback(pid,
4268                                                     process_handle_waitpid_cb,
4269                                                     process_handle);
4270
4271   process_handle->stderr_pipe = stderr_pipe[0];
4272   retval = close(stderr_pipe[1]);
4273
4274   if (-1 == retval) {
4275     log_warn(LD_GENERAL,
4276             "Failed to close write end of stderr pipe in parent process: %s",
4277             strerror(errno));
4278   }
4279
4280   /* Return write end of the stdin pipe to caller, and close the read end */
4281   process_handle->stdin_pipe = stdin_pipe[1];
4282   retval = close(stdin_pipe[0]);
4283
4284   if (-1 == retval) {
4285     log_warn(LD_GENERAL,
4286             "Failed to close read end of stdin pipe in parent process: %s",
4287             strerror(errno));
4288   }
4289
4290   status = process_handle->status = PROCESS_STATUS_RUNNING;
4291   /* Set stdin/stdout/stderr pipes to be non-blocking */
4292   if (fcntl(process_handle->stdout_pipe, F_SETFL, O_NONBLOCK) < 0 ||
4293       fcntl(process_handle->stderr_pipe, F_SETFL, O_NONBLOCK) < 0 ||
4294       fcntl(process_handle->stdin_pipe, F_SETFL, O_NONBLOCK) < 0) {
4295     log_warn(LD_GENERAL, "Failed to set stderror/stdout/stdin pipes "
4296              "nonblocking in parent process: %s", strerror(errno));
4297   }
4298   /* Open the buffered IO streams */
4299   process_handle->stdout_handle = fdopen(process_handle->stdout_pipe, "r");
4300   process_handle->stderr_handle = fdopen(process_handle->stderr_pipe, "r");
4301   process_handle->stdin_handle = fdopen(process_handle->stdin_pipe, "r");
4302
4303   *process_handle_out = process_handle;
4304   return process_handle->status;
4305 #endif // _WIN32
4306 }
4307
4308 /** Destroy all resources allocated by the process handle in
4309  *  <b>process_handle</b>.
4310  *  If <b>also_terminate_process</b> is true, also terminate the
4311  *  process of the process handle. */
4312 MOCK_IMPL(void,
4313 tor_process_handle_destroy,(process_handle_t *process_handle,
4314                             int also_terminate_process))
4315 {
4316   if (!process_handle)
4317     return;
4318
4319   if (also_terminate_process) {
4320     if (tor_terminate_process(process_handle) < 0) {
4321       const char *errstr =
4322 #ifdef _WIN32
4323         format_win32_error(GetLastError());
4324 #else
4325         strerror(errno);
4326 #endif
4327       log_notice(LD_GENERAL, "Failed to terminate process with "
4328                  "PID '%d' ('%s').", tor_process_get_pid(process_handle),
4329                  errstr);
4330     } else {
4331       log_info(LD_GENERAL, "Terminated process with PID '%d'.",
4332                tor_process_get_pid(process_handle));
4333     }
4334   }
4335
4336   process_handle->status = PROCESS_STATUS_NOTRUNNING;
4337
4338 #ifdef _WIN32
4339   if (process_handle->stdout_pipe)
4340     CloseHandle(process_handle->stdout_pipe);
4341
4342   if (process_handle->stderr_pipe)
4343     CloseHandle(process_handle->stderr_pipe);
4344
4345   if (process_handle->stdin_pipe)
4346     CloseHandle(process_handle->stdin_pipe);
4347 #else
4348   if (process_handle->stdout_handle)
4349     fclose(process_handle->stdout_handle);
4350
4351   if (process_handle->stderr_handle)
4352     fclose(process_handle->stderr_handle);
4353
4354   if (process_handle->stdin_handle)
4355     fclose(process_handle->stdin_handle);
4356
4357   clear_waitpid_callback(process_handle->waitpid_cb);
4358 #endif
4359
4360   memset(process_handle, 0x0f, sizeof(process_handle_t));
4361   tor_free(process_handle);
4362 }
4363
4364 /** Get the exit code of a process specified by <b>process_handle</b> and store
4365  * it in <b>exit_code</b>, if set to a non-NULL value.  If <b>block</b> is set
4366  * to true, the call will block until the process has exited.  Otherwise if
4367  * the process is still running, the function will return
4368  * PROCESS_EXIT_RUNNING, and exit_code will be left unchanged. Returns
4369  * PROCESS_EXIT_EXITED if the process did exit. If there is a failure,
4370  * PROCESS_EXIT_ERROR will be returned and the contents of exit_code (if
4371  * non-NULL) will be undefined. N.B. Under *nix operating systems, this will
4372  * probably not work in Tor, because waitpid() is called in main.c to reap any
4373  * terminated child processes.*/
4374 int
4375 tor_get_exit_code(process_handle_t *process_handle,
4376                   int block, int *exit_code)
4377 {
4378 #ifdef _WIN32
4379   DWORD retval;
4380   BOOL success;
4381
4382   if (block) {
4383     /* Wait for the process to exit */
4384     retval = WaitForSingleObject(process_handle->pid.hProcess, INFINITE);
4385     if (retval != WAIT_OBJECT_0) {
4386       log_warn(LD_GENERAL, "WaitForSingleObject() failed (%d): %s",
4387               (int)retval, format_win32_error(GetLastError()));
4388       return PROCESS_EXIT_ERROR;
4389     }
4390   } else {
4391     retval = WaitForSingleObject(process_handle->pid.hProcess, 0);
4392     if (WAIT_TIMEOUT == retval) {
4393       /* Process has not exited */
4394       return PROCESS_EXIT_RUNNING;
4395     } else if (retval != WAIT_OBJECT_0) {
4396       log_warn(LD_GENERAL, "WaitForSingleObject() failed (%d): %s",
4397                (int)retval, format_win32_error(GetLastError()));
4398       return PROCESS_EXIT_ERROR;
4399     }
4400   }
4401
4402   if (exit_code != NULL) {
4403     success = GetExitCodeProcess(process_handle->pid.hProcess,
4404                                  (PDWORD)exit_code);
4405     if (!success) {
4406       log_warn(LD_GENERAL, "GetExitCodeProcess() failed: %s",
4407                format_win32_error(GetLastError()));
4408       return PROCESS_EXIT_ERROR;
4409     }
4410   }
4411 #else
4412   int stat_loc;
4413   int retval;
4414
4415   if (process_handle->waitpid_cb) {
4416     /* We haven't processed a SIGCHLD yet. */
4417     retval = waitpid(process_handle->pid, &stat_loc, block?0:WNOHANG);
4418     if (retval == process_handle->pid) {
4419       clear_waitpid_callback(process_handle->waitpid_cb);
4420       process_handle->waitpid_cb = NULL;
4421       process_handle->waitpid_exit_status = stat_loc;
4422     }
4423   } else {
4424     /* We already got a SIGCHLD for this process, and handled it. */
4425     retval = process_handle->pid;
4426     stat_loc = process_handle->waitpid_exit_status;
4427   }
4428
4429   if (!block && 0 == retval) {
4430     /* Process has not exited */
4431     return PROCESS_EXIT_RUNNING;
4432   } else if (retval != process_handle->pid) {
4433     log_warn(LD_GENERAL, "waitpid() failed for PID %d: %s",
4434              process_handle->pid, strerror(errno));
4435     return PROCESS_EXIT_ERROR;
4436   }
4437
4438   if (!WIFEXITED(stat_loc)) {
4439     log_warn(LD_GENERAL, "Process %d did not exit normally",
4440              process_handle->pid);
4441     return PROCESS_EXIT_ERROR;
4442   }
4443
4444   if (exit_code != NULL)
4445     *exit_code = WEXITSTATUS(stat_loc);
4446 #endif // _WIN32
4447
4448   return PROCESS_EXIT_EXITED;
4449 }
4450
4451 /** Helper: return the number of characters in <b>s</b> preceding the first
4452  * occurrence of <b>ch</b>. If <b>ch</b> does not occur in <b>s</b>, return
4453  * the length of <b>s</b>. Should be equivalent to strspn(s, "ch"). */
4454 static inline size_t
4455 str_num_before(const char *s, char ch)
4456 {
4457   const char *cp = strchr(s, ch);
4458   if (cp)
4459     return cp - s;
4460   else
4461     return strlen(s);
4462 }
4463
4464 /** Return non-zero iff getenv would consider <b>s1</b> and <b>s2</b>
4465  * to have the same name as strings in a process's environment. */
4466 int
4467 environment_variable_names_equal(const char *s1, const char *s2)
4468 {
4469   size_t s1_name_len = str_num_before(s1, '=');
4470   size_t s2_name_len = str_num_before(s2, '=');
4471
4472   return (s1_name_len == s2_name_len &&
4473           tor_memeq(s1, s2, s1_name_len));
4474 }
4475
4476 /** Free <b>env</b> (assuming it was produced by
4477  * process_environment_make). */
4478 void
4479 process_environment_free(process_environment_t *env)
4480 {
4481   if (env == NULL) return;
4482
4483   /* As both an optimization hack to reduce consing on Unixoid systems
4484    * and a nice way to ensure that some otherwise-Windows-specific
4485    * code will always get tested before changes to it get merged, the
4486    * strings which env->unixoid_environment_block points to are packed
4487    * into env->windows_environment_block. */
4488   tor_free(env->unixoid_environment_block);
4489   tor_free(env->windows_environment_block);
4490
4491   tor_free(env);
4492 }
4493
4494 /** Make a process_environment_t containing the environment variables
4495  * specified in <b>env_vars</b> (as C strings of the form
4496  * "NAME=VALUE"). */
4497 process_environment_t *
4498 process_environment_make(struct smartlist_t *env_vars)
4499 {
4500   process_environment_t *env = tor_malloc_zero(sizeof(process_environment_t));
4501   size_t n_env_vars = smartlist_len(env_vars);
4502   size_t i;
4503   size_t total_env_length;
4504   smartlist_t *env_vars_sorted;
4505
4506   tor_assert(n_env_vars + 1 != 0);
4507   env->unixoid_environment_block = tor_calloc(n_env_vars + 1, sizeof(char *));
4508   /* env->unixoid_environment_block is already NULL-terminated,
4509    * because we assume that NULL == 0 (and check that during compilation). */
4510
4511   total_env_length = 1; /* terminating NUL of terminating empty string */
4512   for (i = 0; i < n_env_vars; ++i) {
4513     const char *s = smartlist_get(env_vars, i);
4514     size_t slen = strlen(s);
4515
4516     tor_assert(slen + 1 != 0);
4517     tor_assert(slen + 1 < SIZE_MAX - total_env_length);
4518     total_env_length += slen + 1;
4519   }
4520
4521   env->windows_environment_block = tor_malloc_zero(total_env_length);
4522   /* env->windows_environment_block is already
4523    * (NUL-terminated-empty-string)-terminated. */
4524
4525   /* Some versions of Windows supposedly require that environment
4526    * blocks be sorted.  Or maybe some Windows programs (or their
4527    * runtime libraries) fail to look up strings in non-sorted
4528    * environment blocks.
4529    *
4530    * Also, sorting strings makes it easy to find duplicate environment
4531    * variables and environment-variable strings without an '=' on all
4532    * OSes, and they can cause badness.  Let's complain about those. */
4533   env_vars_sorted = smartlist_new();
4534   smartlist_add_all(env_vars_sorted, env_vars);
4535   smartlist_sort_strings(env_vars_sorted);
4536
4537   /* Now copy the strings into the environment blocks. */
4538   {
4539     char *cp = env->windows_environment_block;
4540     const char *prev_env_var = NULL;
4541
4542     for (i = 0; i < n_env_vars; ++i) {
4543       const char *s = smartlist_get(env_vars_sorted, i);
4544       size_t slen = strlen(s);
4545       size_t s_name_len = str_num_before(s, '=');
4546
4547       if (s_name_len == slen) {
4548         log_warn(LD_GENERAL,
4549                  "Preparing an environment containing a variable "
4550                  "without a value: %s",
4551                  s);
4552       }
4553       if (prev_env_var != NULL &&
4554           environment_variable_names_equal(s, prev_env_var)) {
4555         log_warn(LD_GENERAL,
4556                  "Preparing an environment containing two variables "
4557                  "with the same name: %s and %s",
4558                  prev_env_var, s);
4559       }
4560
4561       prev_env_var = s;
4562
4563       /* Actually copy the string into the environment. */
4564       memcpy(cp, s, slen+1);
4565       env->unixoid_environment_block[i] = cp;
4566       cp += slen+1;
4567     }
4568
4569     tor_assert(cp == env->windows_environment_block + total_env_length - 1);
4570   }
4571
4572   smartlist_free(env_vars_sorted);
4573
4574   return env;
4575 }
4576
4577 /** Return a newly allocated smartlist containing every variable in
4578  * this process's environment, as a NUL-terminated string of the form
4579  * "NAME=VALUE".  Note that on some/many/most/all OSes, the parent
4580  * process can put strings not of that form in our environment;
4581  * callers should try to not get crashed by that.
4582  *
4583  * The returned strings are heap-allocated, and must be freed by the
4584  * caller. */
4585 struct smartlist_t *
4586 get_current_process_environment_variables(void)
4587 {
4588   smartlist_t *sl = smartlist_new();
4589
4590   char **environ_tmp; /* Not const char ** ? Really? */
4591   for (environ_tmp = get_environment(); *environ_tmp; ++environ_tmp) {
4592     smartlist_add(sl, tor_strdup(*environ_tmp));
4593   }
4594
4595   return sl;
4596 }
4597
4598 /** For each string s in <b>env_vars</b> such that
4599  * environment_variable_names_equal(s, <b>new_var</b>), remove it; if
4600  * <b>free_p</b> is non-zero, call <b>free_old</b>(s).  If
4601  * <b>new_var</b> contains '=', insert it into <b>env_vars</b>. */
4602 void
4603 set_environment_variable_in_smartlist(struct smartlist_t *env_vars,
4604                                       const char *new_var,
4605                                       void (*free_old)(void*),
4606                                       int free_p)
4607 {
4608   SMARTLIST_FOREACH_BEGIN(env_vars, const char *, s) {
4609     if (environment_variable_names_equal(s, new_var)) {
4610       SMARTLIST_DEL_CURRENT(env_vars, s);
4611       if (free_p) {
4612         free_old((void *)s);
4613       }
4614     }
4615   } SMARTLIST_FOREACH_END(s);
4616
4617   if (strchr(new_var, '=') != NULL) {
4618     smartlist_add(env_vars, (void *)new_var);
4619   }
4620 }
4621
4622 #ifdef _WIN32
4623 /** Read from a handle <b>h</b> into <b>buf</b>, up to <b>count</b> bytes.  If
4624  * <b>hProcess</b> is NULL, the function will return immediately if there is
4625  * nothing more to read. Otherwise <b>hProcess</b> should be set to the handle
4626  * to the process owning the <b>h</b>. In this case, the function will exit
4627  * only once the process has exited, or <b>count</b> bytes are read. Returns
4628  * the number of bytes read, or -1 on error. */
4629 ssize_t
4630 tor_read_all_handle(HANDLE h, char *buf, size_t count,
4631                     const process_handle_t *process)
4632 {
4633   size_t numread = 0;
4634   BOOL retval;
4635   DWORD byte_count;
4636   BOOL process_exited = FALSE;
4637
4638   if (count > SIZE_T_CEILING || count > SSIZE_MAX)
4639     return -1;
4640
4641   while (numread != count) {
4642     /* Check if there is anything to read */
4643     retval = PeekNamedPipe(h, NULL, 0, NULL, &byte_count, NULL);
4644     if (!retval) {
4645       log_warn(LD_GENERAL,
4646         "Failed to peek from handle: %s",
4647         format_win32_error(GetLastError()));
4648       return -1;
4649     } else if (0 == byte_count) {
4650       /* Nothing available: process exited or it is busy */
4651
4652       /* Exit if we don't know whether the process is running */
4653       if (NULL == process)
4654         break;
4655
4656       /* The process exited and there's nothing left to read from it */
4657       if (process_exited)
4658         break;
4659
4660       /* If process is not running, check for output one more time in case
4661          it wrote something after the peek was performed. Otherwise keep on
4662          waiting for output */
4663       tor_assert(process != NULL);
4664       byte_count = WaitForSingleObject(process->pid.hProcess, 0);
4665       if (WAIT_TIMEOUT != byte_count)
4666         process_exited = TRUE;
4667
4668       continue;
4669     }
4670
4671     /* There is data to read; read it */
4672     retval = ReadFile(h, buf+numread, count-numread, &byte_count, NULL);
4673     tor_assert(byte_count + numread <= count);
4674     if (!retval) {
4675       log_warn(LD_GENERAL, "Failed to read from handle: %s",
4676         format_win32_error(GetLastError()));
4677       return -1;
4678     } else if (0 == byte_count) {
4679       /* End of file */
4680       break;
4681     }
4682     numread += byte_count;
4683   }
4684   return (ssize_t)numread;
4685 }
4686 #else
4687 /** Read from a handle <b>h</b> into <b>buf</b>, up to <b>count</b> bytes.  If
4688  * <b>process</b> is NULL, the function will return immediately if there is
4689  * nothing more to read. Otherwise data will be read until end of file, or
4690  * <b>count</b> bytes are read.  Returns the number of bytes read, or -1 on
4691  * error. Sets <b>eof</b> to true if <b>eof</b> is not NULL and the end of the
4692  * file has been reached. */
4693 ssize_t
4694 tor_read_all_handle(FILE *h, char *buf, size_t count,
4695                     const process_handle_t *process,
4696                     int *eof)
4697 {
4698   size_t numread = 0;
4699   char *retval;
4700
4701   if (eof)
4702     *eof = 0;
4703
4704   if (count > SIZE_T_CEILING || count > SSIZE_MAX)
4705     return -1;
4706
4707   while (numread != count) {
4708     /* Use fgets because that is what we use in log_from_pipe() */
4709     retval = fgets(buf+numread, (int)(count-numread), h);
4710     if (NULL == retval) {
4711       if (feof(h)) {
4712         log_debug(LD_GENERAL, "fgets() reached end of file");
4713         if (eof)
4714           *eof = 1;
4715         break;
4716       } else {
4717         if (EAGAIN == errno) {
4718           if (process)
4719             continue;
4720           else
4721             break;
4722         } else {
4723           log_warn(LD_GENERAL, "fgets() from handle failed: %s",
4724                    strerror(errno));
4725           return -1;
4726         }
4727       }
4728     }
4729     tor_assert(retval != NULL);
4730     tor_assert(strlen(retval) + numread <= count);
4731     numread += strlen(retval);
4732   }
4733
4734   log_debug(LD_GENERAL, "fgets() read %d bytes from handle", (int)numread);
4735   return (ssize_t)numread;
4736 }
4737 #endif
4738
4739 /** Read from stdout of a process until the process exits. */
4740 ssize_t
4741 tor_read_all_from_process_stdout(const process_handle_t *process_handle,
4742                                  char *buf, size_t count)
4743 {
4744 #ifdef _WIN32
4745   return tor_read_all_handle(process_handle->stdout_pipe, buf, count,
4746                              process_handle);
4747 #else
4748   return tor_read_all_handle(process_handle->stdout_handle, buf, count,
4749                              process_handle, NULL);
4750 #endif
4751 }
4752
4753 /** Read from stdout of a process until the process exits. */
4754 ssize_t
4755 tor_read_all_from_process_stderr(const process_handle_t *process_handle,
4756                                  char *buf, size_t count)
4757 {
4758 #ifdef _WIN32
4759   return tor_read_all_handle(process_handle->stderr_pipe, buf, count,
4760                              process_handle);
4761 #else
4762   return tor_read_all_handle(process_handle->stderr_handle, buf, count,
4763                              process_handle, NULL);
4764 #endif
4765 }
4766
4767 /** Split buf into lines, and add to smartlist. The buffer <b>buf</b> will be
4768  * modified. The resulting smartlist will consist of pointers to buf, so there
4769  * is no need to free the contents of sl. <b>buf</b> must be a NUL-terminated
4770  * string. <b>len</b> should be set to the length of the buffer excluding the
4771  * NUL. Non-printable characters (including NUL) will be replaced with "." */
4772 int
4773 tor_split_lines(smartlist_t *sl, char *buf, int len)
4774 {
4775   /* Index in buf of the start of the current line */
4776   int start = 0;
4777   /* Index in buf of the current character being processed */
4778   int cur = 0;
4779   /* Are we currently in a line */
4780   char in_line = 0;
4781
4782   /* Loop over string */
4783   while (cur < len) {
4784     /* Loop until end of line or end of string */
4785     for (; cur < len; cur++) {
4786       if (in_line) {
4787         if ('\r' == buf[cur] || '\n' == buf[cur]) {
4788           /* End of line */
4789           buf[cur] = '\0';
4790           /* Point cur to the next line */
4791           cur++;
4792           /* Line starts at start and ends with a nul */
4793           break;
4794         } else {
4795           if (!TOR_ISPRINT(buf[cur]))
4796             buf[cur] = '.';
4797         }
4798       } else {
4799         if ('\r' == buf[cur] || '\n' == buf[cur]) {
4800           /* Skip leading vertical space */
4801           ;
4802         } else {
4803           in_line = 1;
4804           start = cur;
4805           if (!TOR_ISPRINT(buf[cur]))
4806             buf[cur] = '.';
4807         }
4808       }
4809     }
4810     /* We are at the end of the line or end of string. If in_line is true there
4811      * is a line which starts at buf+start and ends at a NUL. cur points to
4812      * the character after the NUL. */
4813     if (in_line)
4814       smartlist_add(sl, (void *)(buf+start));
4815     in_line = 0;
4816   }
4817   return smartlist_len(sl);
4818 }
4819
4820 /** Return a string corresponding to <b>stream_status</b>. */
4821 const char *
4822 stream_status_to_string(enum stream_status stream_status)
4823 {
4824   switch (stream_status) {
4825     case IO_STREAM_OKAY:
4826       return "okay";
4827     case IO_STREAM_EAGAIN:
4828       return "temporarily unavailable";
4829     case IO_STREAM_TERM:
4830       return "terminated";
4831     case IO_STREAM_CLOSED:
4832       return "closed";
4833     default:
4834       tor_fragile_assert();
4835       return "unknown";
4836   }
4837 }
4838
4839 /* DOCDOC */
4840 static void
4841 log_portfw_spawn_error_message(const char *buf,
4842                                const char *executable, int *child_status)
4843 {
4844   /* Parse error message */
4845   int retval, child_state, saved_errno;
4846   retval = tor_sscanf(buf, SPAWN_ERROR_MESSAGE "%x/%x",
4847                       &child_state, &saved_errno);
4848   if (retval == 2) {
4849     log_warn(LD_GENERAL,
4850              "Failed to start child process \"%s\" in state %d: %s",
4851              executable, child_state, strerror(saved_errno));
4852     if (child_status)
4853       *child_status = 1;
4854   } else {
4855     /* Failed to parse message from child process, log it as a
4856        warning */
4857     log_warn(LD_GENERAL,
4858              "Unexpected message from port forwarding helper \"%s\": %s",
4859              executable, buf);
4860   }
4861 }
4862
4863 #ifdef _WIN32
4864
4865 /** Return a smartlist containing lines outputted from
4866  *  <b>handle</b>. Return NULL on error, and set
4867  *  <b>stream_status_out</b> appropriately. */
4868 MOCK_IMPL(smartlist_t *,
4869 tor_get_lines_from_handle, (HANDLE *handle,
4870                             enum stream_status *stream_status_out))
4871 {
4872   int pos;
4873   char stdout_buf[600] = {0};
4874   smartlist_t *lines = NULL;
4875
4876   tor_assert(stream_status_out);
4877
4878   *stream_status_out = IO_STREAM_TERM;
4879
4880   pos = tor_read_all_handle(handle, stdout_buf, sizeof(stdout_buf) - 1, NULL);
4881   if (pos < 0) {
4882     *stream_status_out = IO_STREAM_TERM;
4883     return NULL;
4884   }
4885   if (pos == 0) {
4886     *stream_status_out = IO_STREAM_EAGAIN;
4887     return NULL;
4888   }
4889
4890   /* End with a null even if there isn't a \r\n at the end */
4891   /* TODO: What if this is a partial line? */
4892   stdout_buf[pos] = '\0';
4893
4894   /* Split up the buffer */
4895   lines = smartlist_new();
4896   tor_split_lines(lines, stdout_buf, pos);
4897
4898   /* Currently 'lines' is populated with strings residing on the
4899      stack. Replace them with their exact copies on the heap: */
4900   SMARTLIST_FOREACH(lines, char *, line,
4901                     SMARTLIST_REPLACE_CURRENT(lines, line, tor_strdup(line)));
4902
4903   *stream_status_out = IO_STREAM_OKAY;
4904
4905   return lines;
4906 }
4907
4908 /** Read from stream, and send lines to log at the specified log level.
4909  * Returns -1 if there is a error reading, and 0 otherwise.
4910  * If the generated stream is flushed more often than on new lines, or
4911  * a read exceeds 256 bytes, lines will be truncated. This should be fixed,
4912  * along with the corresponding problem on *nix (see bug #2045).
4913  */
4914 static int
4915 log_from_handle(HANDLE *pipe, int severity)
4916 {
4917   char buf[256];
4918   int pos;
4919   smartlist_t *lines;
4920
4921   pos = tor_read_all_handle(pipe, buf, sizeof(buf) - 1, NULL);
4922   if (pos < 0) {
4923     /* Error */
4924     log_warn(LD_GENERAL, "Failed to read data from subprocess");
4925     return -1;
4926   }
4927
4928   if (0 == pos) {
4929     /* There's nothing to read (process is busy or has exited) */
4930     log_debug(LD_GENERAL, "Subprocess had nothing to say");
4931     return 0;
4932   }
4933
4934   /* End with a null even if there isn't a \r\n at the end */
4935   /* TODO: What if this is a partial line? */
4936   buf[pos] = '\0';
4937   log_debug(LD_GENERAL, "Subprocess had %d bytes to say", pos);
4938
4939   /* Split up the buffer */
4940   lines = smartlist_new();
4941   tor_split_lines(lines, buf, pos);
4942
4943   /* Log each line */
4944   SMARTLIST_FOREACH(lines, char *, line,
4945   {
4946     log_fn(severity, LD_GENERAL, "Port forwarding helper says: %s", line);
4947   });
4948   smartlist_free(lines);
4949
4950   return 0;
4951 }
4952
4953 #else
4954
4955 /** Return a smartlist containing lines outputted from
4956  *  <b>handle</b>. Return NULL on error, and set
4957  *  <b>stream_status_out</b> appropriately. */
4958 MOCK_IMPL(smartlist_t *,
4959 tor_get_lines_from_handle, (FILE *handle,
4960                             enum stream_status *stream_status_out))
4961 {
4962   enum stream_status stream_status;
4963   char stdout_buf[400];
4964   smartlist_t *lines = NULL;
4965
4966   while (1) {
4967     memset(stdout_buf, 0, sizeof(stdout_buf));
4968
4969     stream_status = get_string_from_pipe(handle,
4970                                          stdout_buf, sizeof(stdout_buf) - 1);
4971     if (stream_status != IO_STREAM_OKAY)
4972       goto done;
4973
4974     if (!lines) lines = smartlist_new();
4975     smartlist_add(lines, tor_strdup(stdout_buf));
4976   }
4977
4978  done:
4979   *stream_status_out = stream_status;
4980   return lines;
4981 }
4982
4983 /** Read from stream, and send lines to log at the specified log level.
4984  * Returns 1 if stream is closed normally, -1 if there is a error reading, and
4985  * 0 otherwise. Handles lines from tor-fw-helper and
4986  * tor_spawn_background() specially.
4987  */
4988 static int
4989 log_from_pipe(FILE *stream, int severity, const char *executable,
4990               int *child_status)
4991 {
4992   char buf[256];
4993   enum stream_status r;
4994
4995   for (;;) {
4996     r = get_string_from_pipe(stream, buf, sizeof(buf) - 1);
4997
4998     if (r == IO_STREAM_CLOSED) {
4999       return 1;
5000     } else if (r == IO_STREAM_EAGAIN) {
5001       return 0;
5002     } else if (r == IO_STREAM_TERM) {
5003       return -1;
5004     }
5005
5006     tor_assert(r == IO_STREAM_OKAY);
5007
5008     /* Check if buf starts with SPAWN_ERROR_MESSAGE */
5009     if (strcmpstart(buf, SPAWN_ERROR_MESSAGE) == 0) {
5010       log_portfw_spawn_error_message(buf, executable, child_status);
5011     } else {
5012       log_fn(severity, LD_GENERAL, "Port forwarding helper says: %s", buf);
5013     }
5014   }
5015
5016   /* We should never get here */
5017   return -1;
5018 }
5019 #endif
5020
5021 /** Reads from <b>stream</b> and stores input in <b>buf_out</b> making
5022  *  sure it's below <b>count</b> bytes.
5023  *  If the string has a trailing newline, we strip it off.
5024  *
5025  * This function is specifically created to handle input from managed
5026  * proxies, according to the pluggable transports spec. Make sure it
5027  * fits your needs before using it.
5028  *
5029  * Returns:
5030  * IO_STREAM_CLOSED: If the stream is closed.
5031  * IO_STREAM_EAGAIN: If there is nothing to read and we should check back
5032  *  later.
5033  * IO_STREAM_TERM: If something is wrong with the stream.
5034  * IO_STREAM_OKAY: If everything went okay and we got a string
5035  *  in <b>buf_out</b>. */
5036 enum stream_status
5037 get_string_from_pipe(FILE *stream, char *buf_out, size_t count)
5038 {
5039   char *retval;
5040   size_t len;
5041
5042   tor_assert(count <= INT_MAX);
5043
5044   retval = fgets(buf_out, (int)count, stream);
5045
5046   if (!retval) {
5047     if (feof(stream)) {
5048       /* Program has closed stream (probably it exited) */
5049       /* TODO: check error */
5050       return IO_STREAM_CLOSED;
5051     } else {
5052       if (EAGAIN == errno) {
5053         /* Nothing more to read, try again next time */
5054         return IO_STREAM_EAGAIN;
5055       } else {
5056         /* There was a problem, abandon this child process */
5057         return IO_STREAM_TERM;
5058       }
5059     }
5060   } else {
5061     len = strlen(buf_out);
5062     if (len == 0) {
5063       /* this probably means we got a NUL at the start of the string. */
5064       return IO_STREAM_EAGAIN;
5065     }
5066
5067     if (buf_out[len - 1] == '\n') {
5068       /* Remove the trailing newline */
5069       buf_out[len - 1] = '\0';
5070     } else {
5071       /* No newline; check whether we overflowed the buffer */
5072       if (!feof(stream))
5073         log_info(LD_GENERAL,
5074                  "Line from stream was truncated: %s", buf_out);
5075       /* TODO: What to do with this error? */
5076     }
5077
5078     return IO_STREAM_OKAY;
5079   }
5080
5081   /* We should never get here */
5082   return IO_STREAM_TERM;
5083 }
5084
5085 /** Parse a <b>line</b> from tor-fw-helper and issue an appropriate
5086  *  log message to our user. */
5087 static void
5088 handle_fw_helper_line(const char *executable, const char *line)
5089 {
5090   smartlist_t *tokens = smartlist_new();
5091   char *message = NULL;
5092   char *message_for_log = NULL;
5093   const char *external_port = NULL;
5094   const char *internal_port = NULL;
5095   const char *result = NULL;
5096   int port = 0;
5097   int success = 0;
5098
5099   if (strcmpstart(line, SPAWN_ERROR_MESSAGE) == 0) {
5100     /* We need to check for SPAWN_ERROR_MESSAGE again here, since it's
5101      * possible that it got sent after we tried to read it in log_from_pipe.
5102      *
5103      * XXX Ideally, we should be using one of stdout/stderr for the real
5104      * output, and one for the output of the startup code.  We used to do that
5105      * before cd05f35d2c.
5106      */
5107     int child_status;
5108     log_portfw_spawn_error_message(line, executable, &child_status);
5109     goto done;
5110   }
5111
5112   smartlist_split_string(tokens, line, NULL,
5113                          SPLIT_SKIP_SPACE|SPLIT_IGNORE_BLANK, -1);
5114
5115   if (smartlist_len(tokens) < 5)
5116     goto err;
5117
5118   if (strcmp(smartlist_get(tokens, 0), "tor-fw-helper") ||
5119       strcmp(smartlist_get(tokens, 1), "tcp-forward"))
5120     goto err;
5121
5122   external_port = smartlist_get(tokens, 2);
5123   internal_port = smartlist_get(tokens, 3);
5124   result = smartlist_get(tokens, 4);
5125
5126   if (smartlist_len(tokens) > 5) {
5127     /* If there are more than 5 tokens, they are part of [<message>].
5128        Let's use a second smartlist to form the whole message;
5129        strncat loops suck. */
5130     int i;
5131     int message_words_n = smartlist_len(tokens) - 5;
5132     smartlist_t *message_sl = smartlist_new();
5133     for (i = 0; i < message_words_n; i++)
5134       smartlist_add(message_sl, smartlist_get(tokens, 5+i));
5135
5136     tor_assert(smartlist_len(message_sl) > 0);
5137     message = smartlist_join_strings(message_sl, " ", 0, NULL);
5138
5139     /* wrap the message in log-friendly wrapping */
5140     tor_asprintf(&message_for_log, " ('%s')", message);
5141
5142     smartlist_free(message_sl);
5143   }
5144
5145   port = atoi(external_port);
5146   if (port < 1 || port > 65535)
5147     goto err;
5148
5149   port = atoi(internal_port);
5150   if (port < 1 || port > 65535)
5151     goto err;
5152
5153   if (!strcmp(result, "SUCCESS"))
5154     success = 1;
5155   else if (!strcmp(result, "FAIL"))
5156     success = 0;
5157   else
5158     goto err;
5159
5160   if (!success) {
5161     log_warn(LD_GENERAL, "Tor was unable to forward TCP port '%s' to '%s'%s. "
5162              "Please make sure that your router supports port "
5163              "forwarding protocols (like NAT-PMP). Note that if '%s' is "
5164              "your ORPort, your relay will be unable to receive inbound "
5165              "traffic.", external_port, internal_port,
5166              message_for_log ? message_for_log : "",
5167              internal_port);
5168   } else {
5169     log_info(LD_GENERAL,
5170              "Tor successfully forwarded TCP port '%s' to '%s'%s.",
5171              external_port, internal_port,
5172              message_for_log ? message_for_log : "");
5173   }
5174
5175   goto done;
5176
5177  err:
5178   log_warn(LD_GENERAL, "tor-fw-helper sent us a string we could not "
5179            "parse (%s).", line);
5180
5181  done:
5182   SMARTLIST_FOREACH(tokens, char *, cp, tor_free(cp));
5183   smartlist_free(tokens);
5184   tor_free(message);
5185   tor_free(message_for_log);
5186 }
5187
5188 /** Read what tor-fw-helper has to say in its stdout and handle it
5189  *  appropriately */
5190 static int
5191 handle_fw_helper_output(const char *executable,
5192                         process_handle_t *process_handle)
5193 {
5194   smartlist_t *fw_helper_output = NULL;
5195   enum stream_status stream_status = 0;
5196
5197   fw_helper_output =
5198     tor_get_lines_from_handle(tor_process_get_stdout_pipe(process_handle),
5199                               &stream_status);
5200   if (!fw_helper_output) { /* didn't get any output from tor-fw-helper */
5201     /* if EAGAIN we should retry in the future */
5202     return (stream_status == IO_STREAM_EAGAIN) ? 0 : -1;
5203   }
5204
5205   /* Handle the lines we got: */
5206   SMARTLIST_FOREACH_BEGIN(fw_helper_output, char *, line) {
5207     handle_fw_helper_line(executable, line);
5208     tor_free(line);
5209   } SMARTLIST_FOREACH_END(line);
5210
5211   smartlist_free(fw_helper_output);
5212
5213   return 0;
5214 }
5215
5216 /** Spawn tor-fw-helper and ask it to forward the ports in
5217  *  <b>ports_to_forward</b>. <b>ports_to_forward</b> contains strings
5218  *  of the form "<external port>:<internal port>", which is the format
5219  *  that tor-fw-helper expects. */
5220 void
5221 tor_check_port_forwarding(const char *filename,
5222                           smartlist_t *ports_to_forward,
5223                           time_t now)
5224 {
5225 /* When fw-helper succeeds, how long do we wait until running it again */
5226 #define TIME_TO_EXEC_FWHELPER_SUCCESS 300
5227 /* When fw-helper failed to start, how long do we wait until running it again
5228  */
5229 #define TIME_TO_EXEC_FWHELPER_FAIL 60
5230
5231   /* Static variables are initialized to zero, so child_handle.status=0
5232    * which corresponds to it not running on startup */
5233   static process_handle_t *child_handle=NULL;
5234
5235   static time_t time_to_run_helper = 0;
5236   int stderr_status, retval;
5237   int stdout_status = 0;
5238
5239   tor_assert(filename);
5240
5241   /* Start the child, if it is not already running */
5242   if ((!child_handle || child_handle->status != PROCESS_STATUS_RUNNING) &&
5243       time_to_run_helper < now) {
5244     /*tor-fw-helper cli looks like this: tor_fw_helper -p :5555 -p 4555:1111 */
5245     const char **argv; /* cli arguments */
5246     int args_n, status;
5247     int argv_index = 0; /* index inside 'argv' */
5248
5249     tor_assert(smartlist_len(ports_to_forward) > 0);
5250
5251     /* check for overflow during 'argv' allocation:
5252        (len(ports_to_forward)*2 + 2)*sizeof(char*) > SIZE_MAX ==
5253        len(ports_to_forward) > (((SIZE_MAX/sizeof(char*)) - 2)/2) */
5254     if ((size_t) smartlist_len(ports_to_forward) >
5255         (((SIZE_MAX/sizeof(char*)) - 2)/2)) {
5256       log_warn(LD_GENERAL,
5257                "Overflow during argv allocation. This shouldn't happen.");
5258       return;
5259     }
5260     /* check for overflow during 'argv_index' increase:
5261        ((len(ports_to_forward)*2 + 2) > INT_MAX) ==
5262        len(ports_to_forward) > (INT_MAX - 2)/2 */
5263     if (smartlist_len(ports_to_forward) > (INT_MAX - 2)/2) {
5264       log_warn(LD_GENERAL,
5265                "Overflow during argv_index increase. This shouldn't happen.");
5266       return;
5267     }
5268
5269     /* Calculate number of cli arguments: one for the filename, two
5270        for each smartlist element (one for "-p" and one for the
5271        ports), and one for the final NULL. */
5272     args_n = 1 + 2*smartlist_len(ports_to_forward) + 1;
5273     argv = tor_calloc(args_n, sizeof(char *));
5274
5275     argv[argv_index++] = filename;
5276     SMARTLIST_FOREACH_BEGIN(ports_to_forward, const char *, port) {
5277       argv[argv_index++] = "-p";
5278       argv[argv_index++] = port;
5279     } SMARTLIST_FOREACH_END(port);
5280     argv[argv_index] = NULL;
5281
5282     /* Assume tor-fw-helper will succeed, start it later*/
5283     time_to_run_helper = now + TIME_TO_EXEC_FWHELPER_SUCCESS;
5284
5285     if (child_handle) {
5286       tor_process_handle_destroy(child_handle, 1);
5287       child_handle = NULL;
5288     }
5289
5290 #ifdef _WIN32
5291     /* Passing NULL as lpApplicationName makes Windows search for the .exe */
5292     status = tor_spawn_background(NULL, argv, NULL, &child_handle);
5293 #else
5294     status = tor_spawn_background(filename, argv, NULL, &child_handle);
5295 #endif
5296
5297     tor_free_((void*)argv);
5298     argv=NULL;
5299
5300     if (PROCESS_STATUS_ERROR == status) {
5301       log_warn(LD_GENERAL, "Failed to start port forwarding helper %s",
5302               filename);
5303       time_to_run_helper = now + TIME_TO_EXEC_FWHELPER_FAIL;
5304       return;
5305     }
5306
5307     log_info(LD_GENERAL,
5308              "Started port forwarding helper (%s) with pid '%d'",
5309              filename, tor_process_get_pid(child_handle));
5310   }
5311
5312   /* If child is running, read from its stdout and stderr) */
5313   if (child_handle && PROCESS_STATUS_RUNNING == child_handle->status) {
5314     /* Read from stdout/stderr and log result */
5315     retval = 0;
5316 #ifdef _WIN32
5317     stderr_status = log_from_handle(child_handle->stderr_pipe, LOG_INFO);
5318 #else
5319     stderr_status = log_from_pipe(child_handle->stderr_handle,
5320                                   LOG_INFO, filename, &retval);
5321 #endif
5322     if (handle_fw_helper_output(filename, child_handle) < 0) {
5323       log_warn(LD_GENERAL, "Failed to handle fw helper output.");
5324       stdout_status = -1;
5325       retval = -1;
5326     }
5327
5328     if (retval) {
5329       /* There was a problem in the child process */
5330       time_to_run_helper = now + TIME_TO_EXEC_FWHELPER_FAIL;
5331     }
5332
5333     /* Combine the two statuses in order of severity */
5334     if (-1 == stdout_status || -1 == stderr_status)
5335       /* There was a failure */
5336       retval = -1;
5337 #ifdef _WIN32
5338     else if (!child_handle || tor_get_exit_code(child_handle, 0, NULL) !=
5339              PROCESS_EXIT_RUNNING) {
5340       /* process has exited or there was an error */
5341       /* TODO: Do something with the process return value */
5342       /* TODO: What if the process output something since
5343        * between log_from_handle and tor_get_exit_code? */
5344       retval = 1;
5345     }
5346 #else
5347     else if (1 == stdout_status || 1 == stderr_status)
5348       /* stdout or stderr was closed, the process probably
5349        * exited. It will be reaped by waitpid() in main.c */
5350       /* TODO: Do something with the process return value */
5351       retval = 1;
5352 #endif
5353     else
5354       /* Both are fine */
5355       retval = 0;
5356
5357     /* If either pipe indicates a failure, act on it */
5358     if (0 != retval) {
5359       if (1 == retval) {
5360         log_info(LD_GENERAL, "Port forwarding helper terminated");
5361         child_handle->status = PROCESS_STATUS_NOTRUNNING;
5362       } else {
5363         log_warn(LD_GENERAL, "Failed to read from port forwarding helper");
5364         child_handle->status = PROCESS_STATUS_ERROR;
5365       }
5366
5367       /* TODO: The child might not actually be finished (maybe it failed or
5368          closed stdout/stderr), so maybe we shouldn't start another? */
5369     }
5370   }
5371 }
5372
5373 /** Initialize the insecure RNG <b>rng</b> from a seed value <b>seed</b>. */
5374 void
5375 tor_init_weak_random(tor_weak_rng_t *rng, unsigned seed)
5376 {
5377   rng->state = (uint32_t)(seed & 0x7fffffff);
5378 }
5379
5380 /** Return a randomly chosen value in the range 0..TOR_WEAK_RANDOM_MAX based
5381  * on the RNG state of <b>rng</b>.  This entropy will not be cryptographically
5382  * strong; do not rely on it for anything an adversary should not be able to
5383  * predict. */
5384 int32_t
5385 tor_weak_random(tor_weak_rng_t *rng)
5386 {
5387   /* Here's a linear congruential generator. OpenBSD and glibc use these
5388    * parameters; they aren't too bad, and should have maximal period over the
5389    * range 0..INT32_MAX. We don't want to use the platform rand() or random(),
5390    * since some platforms have bad weak RNGs that only return values in the
5391    * range 0..INT16_MAX, which just isn't enough. */
5392   rng->state = (rng->state * 1103515245 + 12345) & 0x7fffffff;
5393   return (int32_t) rng->state;
5394 }
5395
5396 /** Return a random number in the range [0 , <b>top</b>). {That is, the range
5397  * of integers i such that 0 <= i < top.}  Chooses uniformly.  Requires that
5398  * top is greater than 0. This randomness is not cryptographically strong; do
5399  * not rely on it for anything an adversary should not be able to predict. */
5400 int32_t
5401 tor_weak_random_range(tor_weak_rng_t *rng, int32_t top)
5402 {
5403   /* We don't want to just do tor_weak_random() % top, since random() is often
5404    * implemented with an LCG whose modulus is a power of 2, and those are
5405    * cyclic in their low-order bits. */
5406   int divisor, result;
5407   tor_assert(top > 0);
5408   divisor = TOR_WEAK_RANDOM_MAX / top;
5409   do {
5410     result = (int32_t)(tor_weak_random(rng) / divisor);
5411   } while (result >= top);
5412   return result;
5413 }
5414
5415 /** Cast a given double value to a int64_t. Return 0 if number is NaN.
5416  * Returns either INT64_MIN or INT64_MAX if number is outside of the int64_t
5417  * range. */
5418 int64_t
5419 clamp_double_to_int64(double number)
5420 {
5421   int exp;
5422
5423   /* NaN is a special case that can't be used with the logic below. */
5424   if (isnan(number)) {
5425     return 0;
5426   }
5427
5428   /* Time to validate if result can overflows a int64_t value. Fun with
5429    * float! Find that exponent exp such that
5430    *    number == x * 2^exp
5431    * for some x with abs(x) in [0.5, 1.0). Note that this implies that the
5432    * magnitude of number is strictly less than 2^exp.
5433    *
5434    * If number is infinite, the call to frexp is legal but the contents of
5435    * exp are unspecified. */
5436   frexp(number, &exp);
5437
5438   /* If the magnitude of number is strictly less than 2^63, the truncated
5439    * version of number is guaranteed to be representable. The only
5440    * representable integer for which this is not the case is INT64_MIN, but
5441    * it is covered by the logic below. */
5442   if (isfinite(number) && exp <= 63) {
5443     return number;
5444   }
5445
5446   /* Handle infinities and finite numbers with magnitude >= 2^63. */
5447   return signbit(number) ? INT64_MIN : INT64_MAX;
5448 }
5449