src/common/util.c

   1 /* Copyright (c) 2003, Roger Dingledine
   2  * Copyright (c) 2004-2006, Roger Dingledine, Nick Mathewson.
   3  * Copyright (c) 2007-2015, The Tor Project, Inc. */
   4 /* See LICENSE for licensing information */
   5
   6 /**
   7  * \file util.c
   8  * \brief Common functions for strings, IO, network, data structures,
   9  * process control.
  10  **/
  11
  12 /* This is required on rh7 to make strptime not complain.
  13  */
  14 #define _GNU_SOURCE
  15
  16 #include "orconfig.h"
  17 #ifdef HAVE_FCNTL_H
  18 #include <fcntl.h>
  19 #endif
  20 #define UTIL_PRIVATE
  21 #include "util.h"
  22 #include "torlog.h"
  23 #include "crypto.h"
  24 #include "torint.h"
  25 #include "container.h"
  26 #include "address.h"
  27 #include "sandbox.h"
  28 #include "backtrace.h"
  29 #include "util_process.h"
  30
  31 #ifdef _WIN32
  32 #include <io.h>
  33 #include <direct.h>
  34 #include <process.h>
  35 #include <tchar.h>
  36 #include <winbase.h>
  37 #else
  38 #include <dirent.h>
  39 #include <pwd.h>
  40 #include <grp.h>
  41 #endif
  42
  43 /* math.h needs this on Linux */
  44 #ifndef _USE_ISOC99_
  45 #define _USE_ISOC99_ 1
  46 #endif
  47 #include <math.h>
  48 #include <stdlib.h>
  49 #include <stdio.h>
  50 #include <string.h>
  51 #include <assert.h>
  52 #include <signal.h>
  53
  54 #ifdef HAVE_NETINET_IN_H
  55 #include <netinet/in.h>
  56 #endif
  57 #ifdef HAVE_ARPA_INET_H
  58 #include <arpa/inet.h>
  59 #endif
  60 #ifdef HAVE_ERRNO_H
  61 #include <errno.h>
  62 #endif
  63 #ifdef HAVE_SYS_SOCKET_H
  64 #include <sys/socket.h>
  65 #endif
  66 #ifdef HAVE_SYS_TIME_H
  67 #include <sys/time.h>
  68 #endif
  69 #ifdef HAVE_UNISTD_H
  70 #include <unistd.h>
  71 #endif
  72 #ifdef HAVE_SYS_STAT_H
  73 #include <sys/stat.h>
  74 #endif
  75 #ifdef HAVE_SYS_FCNTL_H
  76 #include <sys/fcntl.h>
  77 #endif
  78 #ifdef HAVE_TIME_H
  79 #include <time.h>
  80 #endif
  81 #ifdef HAVE_MALLOC_MALLOC_H
  82 #include <malloc/malloc.h>
  83 #endif
  84 #ifdef HAVE_MALLOC_H
  85 #if !defined(OPENBSD) && !defined(__FreeBSD__)
  86 /* OpenBSD has a malloc.h, but for our purposes, it only exists in order to
  87  * scold us for being so stupid as to autodetect its presence.  To be fair,
  88  * they've done this since 1996, when autoconf was only 5 years old. */
  89 #include <malloc.h>
  90 #endif
  91 #endif
  92 #ifdef HAVE_MALLOC_NP_H
  93 #include <malloc_np.h>
  94 #endif
  95 #ifdef HAVE_SYS_WAIT_H
  96 #include <sys/wait.h>
  97 #endif
  98 #if defined(HAVE_SYS_PRCTL_H) && defined(__linux__)
  99 #include <sys/prctl.h>
 100 #endif
 101
 102 #ifdef __clang_analyzer__
 103 #undef MALLOC_ZERO_WORKS
 104 #endif
 105
 106 /* =====
 107  * Assertion helper.
 108  * ===== */
 109 /** Helper for tor_assert: report the assertion failure. */
 110 void
 111 tor_assertion_failed_(const char *fname, unsigned int line,
 112                       const char *func, const char *expr)
 113 {
 114   char buf[256];
 115   log_err(LD_BUG, "%s:%u: %s: Assertion %s failed; aborting.",
 116           fname, line, func, expr);
 117   tor_snprintf(buf, sizeof(buf),
 118                "Assertion %s failed in %s at %s:%u",
 119                expr, func, fname, line);
 120   log_backtrace(LOG_ERR, LD_BUG, buf);
 121 }
 122
 123 /* =====
 124  * Memory management
 125  * ===== */
 126 #ifdef USE_DMALLOC
 127  #undef strndup
 128  #include <dmalloc.h>
 129  /* Macro to pass the extra dmalloc args to another function. */
 130  #define DMALLOC_FN_ARGS , file, line
 131
 132  #if defined(HAVE_DMALLOC_STRDUP)
 133  /* the dmalloc_strdup should be fine as defined */
 134  #elif defined(HAVE_DMALLOC_STRNDUP)
 135  #define dmalloc_strdup(file, line, string, xalloc_b) \
 136          dmalloc_strndup(file, line, (string), -1, xalloc_b)
 137  #else
 138  #error "No dmalloc_strdup or equivalent"
 139  #endif
 140
 141 #else /* not using dmalloc */
 142
 143  #define DMALLOC_FN_ARGS
 144 #endif
 145
 146 /** Allocate a chunk of <b>size</b> bytes of memory, and return a pointer to
 147  * result.  On error, log and terminate the process.  (Same as malloc(size),
 148  * but never returns NULL.)
 149  *
 150  * <b>file</b> and <b>line</b> are used if dmalloc is enabled, and
 151  * ignored otherwise.
 152  */
 153 void *
 154 tor_malloc_(size_t size DMALLOC_PARAMS)
 155 {
 156   void *result;
 157
 158   tor_assert(size < SIZE_T_CEILING);
 159
 160 #ifndef MALLOC_ZERO_WORKS
 161   /* Some libc mallocs don't work when size==0. Override them. */
 162   if (size==0) {
 163     size=1;
 164   }
 165 #endif
 166
 167 #ifdef USE_DMALLOC
 168   result = dmalloc_malloc(file, line, size, DMALLOC_FUNC_MALLOC, 0, 0);
 169 #else
 170   result = malloc(size);
 171 #endif
 172
 173   if (PREDICT_UNLIKELY(result == NULL)) {
 174     log_err(LD_MM,"Out of memory on malloc(). Dying.");
 175     /* If these functions die within a worker process, they won't call
 176      * spawn_exit, but that's ok, since the parent will run out of memory soon
 177      * anyway. */
 178     exit(1);
 179   }
 180   return result;
 181 }
 182
 183 /** Allocate a chunk of <b>size</b> bytes of memory, fill the memory with
 184  * zero bytes, and return a pointer to the result.  Log and terminate
 185  * the process on error.  (Same as calloc(size,1), but never returns NULL.)
 186  */
 187 void *
 188 tor_malloc_zero_(size_t size DMALLOC_PARAMS)
 189 {
 190   /* You may ask yourself, "wouldn't it be smart to use calloc instead of
 191    * malloc+memset?  Perhaps libc's calloc knows some nifty optimization trick
 192    * we don't!"  Indeed it does, but its optimizations are only a big win when
 193    * we're allocating something very big (it knows if it just got the memory
 194    * from the OS in a pre-zeroed state).  We don't want to use tor_malloc_zero
 195    * for big stuff, so we don't bother with calloc. */
 196   void *result = tor_malloc_(size DMALLOC_FN_ARGS);
 197   memset(result, 0, size);
 198   return result;
 199 }
 200
 201 /* The square root of SIZE_MAX + 1.  If a is less than this, and b is less
 202  * than this, then a*b is less than SIZE_MAX.  (For example, if size_t is
 203  * 32 bits, then SIZE_MAX is 0xffffffff and this value is 0x10000.  If a and
 204  * b are less than this, then their product is at most (65535*65535) ==
 205  * 0xfffe0001. */
 206 #define SQRT_SIZE_MAX_P1 (((size_t)1) << (sizeof(size_t)*4))
 207
 208 /** Return non-zero if and only if the product of the arguments is exact. */
 209 static INLINE int
 210 size_mul_check(const size_t x, const size_t y)
 211 {
 212   /* This first check is equivalent to
 213      (x < SQRT_SIZE_MAX_P1 && y < SQRT_SIZE_MAX_P1)
 214
 215      Rationale: if either one of x or y is >= SQRT_SIZE_MAX_P1, then it
 216      will have some bit set in its most significant half.
 217    */
 218   return ((x|y) < SQRT_SIZE_MAX_P1 ||
 219           y == 0 ||
 220           x <= SIZE_MAX / y);
 221 }
 222
 223 /** Allocate a chunk of <b>nmemb</b>*<b>size</b> bytes of memory, fill
 224  * the memory with zero bytes, and return a pointer to the result.
 225  * Log and terminate the process on error.  (Same as
 226  * calloc(<b>nmemb</b>,<b>size</b>), but never returns NULL.)
 227  * The second argument (<b>size</b>) should preferably be non-zero
 228  * and a compile-time constant.
 229  */
 230 void *
 231 tor_calloc_(size_t nmemb, size_t size DMALLOC_PARAMS)
 232 {
 233   tor_assert(size_mul_check(nmemb, size));
 234   return tor_malloc_zero_((nmemb * size) DMALLOC_FN_ARGS);
 235 }
 236
 237 /** Change the size of the memory block pointed to by <b>ptr</b> to <b>size</b>
 238  * bytes long; return the new memory block.  On error, log and
 239  * terminate. (Like realloc(ptr,size), but never returns NULL.)
 240  */
 241 void *
 242 tor_realloc_(void *ptr, size_t size DMALLOC_PARAMS)
 243 {
 244   void *result;
 245
 246   tor_assert(size < SIZE_T_CEILING);
 247
 248 #ifndef MALLOC_ZERO_WORKS
 249   /* Some libc mallocs don't work when size==0. Override them. */
 250   if (size==0) {
 251     size=1;
 252   }
 253 #endif
 254
 255 #ifdef USE_DMALLOC
 256   result = dmalloc_realloc(file, line, ptr, size, DMALLOC_FUNC_REALLOC, 0);
 257 #else
 258   result = realloc(ptr, size);
 259 #endif
 260
 261   if (PREDICT_UNLIKELY(result == NULL)) {
 262     log_err(LD_MM,"Out of memory on realloc(). Dying.");
 263     exit(1);
 264   }
 265   return result;
 266 }
 267
 268 /**
 269  * Try to realloc <b>ptr</b> so that it takes up sz1 * sz2 bytes.  Check for
 270  * overflow. Unlike other allocation functions, return NULL on overflow.
 271  */
 272 void *
 273 tor_reallocarray_(void *ptr, size_t sz1, size_t sz2 DMALLOC_PARAMS)
 274 {
 275   /* XXXX we can make this return 0, but we would need to check all the
 276    * reallocarray users. */
 277   tor_assert(size_mul_check(sz1, sz2));
 278
 279   return tor_realloc(ptr, (sz1 * sz2) DMALLOC_FN_ARGS);
 280 }
 281
 282 /** Return a newly allocated copy of the NUL-terminated string s. On
 283  * error, log and terminate.  (Like strdup(s), but never returns
 284  * NULL.)
 285  */
 286 char *
 287 tor_strdup_(const char *s DMALLOC_PARAMS)
 288 {
 289   char *dup;
 290   tor_assert(s);
 291
 292 #ifdef USE_DMALLOC
 293   dup = dmalloc_strdup(file, line, s, 0);
 294 #else
 295   dup = strdup(s);
 296 #endif
 297   if (PREDICT_UNLIKELY(dup == NULL)) {
 298     log_err(LD_MM,"Out of memory on strdup(). Dying.");
 299     exit(1);
 300   }
 301   return dup;
 302 }
 303
 304 /** Allocate and return a new string containing the first <b>n</b>
 305  * characters of <b>s</b>.  If <b>s</b> is longer than <b>n</b>
 306  * characters, only the first <b>n</b> are copied.  The result is
 307  * always NUL-terminated.  (Like strndup(s,n), but never returns
 308  * NULL.)
 309  */
 310 char *
 311 tor_strndup_(const char *s, size_t n DMALLOC_PARAMS)
 312 {
 313   char *dup;
 314   tor_assert(s);
 315   tor_assert(n < SIZE_T_CEILING);
 316   dup = tor_malloc_((n+1) DMALLOC_FN_ARGS);
 317   /* Performance note: Ordinarily we prefer strlcpy to strncpy.  But
 318    * this function gets called a whole lot, and platform strncpy is
 319    * much faster than strlcpy when strlen(s) is much longer than n.
 320    */
 321   strncpy(dup, s, n);
 322   dup[n]='\0';
 323   return dup;
 324 }
 325
 326 /** Allocate a chunk of <b>len</b> bytes, with the same contents as the
 327  * <b>len</b> bytes starting at <b>mem</b>. */
 328 void *
 329 tor_memdup_(const void *mem, size_t len DMALLOC_PARAMS)
 330 {
 331   char *dup;
 332   tor_assert(len < SIZE_T_CEILING);
 333   tor_assert(mem);
 334   dup = tor_malloc_(len DMALLOC_FN_ARGS);
 335   memcpy(dup, mem, len);
 336   return dup;
 337 }
 338
 339 /** As tor_memdup(), but add an extra 0 byte at the end of the resulting
 340  * memory. */
 341 void *
 342 tor_memdup_nulterm_(const void *mem, size_t len DMALLOC_PARAMS)
 343 {
 344   char *dup;
 345   tor_assert(len < SIZE_T_CEILING+1);
 346   tor_assert(mem);
 347   dup = tor_malloc_(len+1 DMALLOC_FN_ARGS);
 348   memcpy(dup, mem, len);
 349   dup[len] = '\0';
 350   return dup;
 351 }
 352
 353 /** Helper for places that need to take a function pointer to the right
 354  * spelling of "free()". */
 355 void
 356 tor_free_(void *mem)
 357 {
 358   tor_free(mem);
 359 }
 360
 361 /** Call the platform malloc info function, and dump the results to the log at
 362  * level <b>severity</b>.  If no such function exists, do nothing. */
 363 void
 364 tor_log_mallinfo(int severity)
 365 {
 366 #ifdef HAVE_MALLINFO
 367   struct mallinfo mi;
 368   memset(&mi, 0, sizeof(mi));
 369   mi = mallinfo();
 370   tor_log(severity, LD_MM,
 371       "mallinfo() said: arena=%d, ordblks=%d, smblks=%d, hblks=%d, "
 372       "hblkhd=%d, usmblks=%d, fsmblks=%d, uordblks=%d, fordblks=%d, "
 373       "keepcost=%d",
 374       mi.arena, mi.ordblks, mi.smblks, mi.hblks,
 375       mi.hblkhd, mi.usmblks, mi.fsmblks, mi.uordblks, mi.fordblks,
 376       mi.keepcost);
 377 #else
 378   (void)severity;
 379 #endif
 380 #ifdef USE_DMALLOC
 381   dmalloc_log_changed(0, /* Since the program started. */
 382                       1, /* Log info about non-freed pointers. */
 383                       0, /* Do not log info about freed pointers. */
 384                       0  /* Do not log individual pointers. */
 385                       );
 386 #endif
 387 }
 388
 389 /* =====
 390  * Math
 391  * ===== */
 392
 393 /**
 394  * Returns the natural logarithm of d base e.  We defined this wrapper here so
 395  * to avoid conflicts with old versions of tor_log(), which were named log().
 396  */
 397 double
 398 tor_mathlog(double d)
 399 {
 400   return log(d);
 401 }
 402
 403 /** Return the long integer closest to <b>d</b>. We define this wrapper
 404  * here so that not all users of math.h need to use the right incantations
 405  * to get the c99 functions. */
 406 long
 407 tor_lround(double d)
 408 {
 409 #if defined(HAVE_LROUND)
 410   return lround(d);
 411 #elif defined(HAVE_RINT)
 412   return (long)rint(d);
 413 #else
 414   return (long)(d > 0 ? d + 0.5 : ceil(d - 0.5));
 415 #endif
 416 }
 417
 418 /** Return the 64-bit integer closest to d.  We define this wrapper here so
 419  * that not all users of math.h need to use the right incantations to get the
 420  * c99 functions. */
 421 int64_t
 422 tor_llround(double d)
 423 {
 424 #if defined(HAVE_LLROUND)
 425   return (int64_t)llround(d);
 426 #elif defined(HAVE_RINT)
 427   return (int64_t)rint(d);
 428 #else
 429   return (int64_t)(d > 0 ? d + 0.5 : ceil(d - 0.5));
 430 #endif
 431 }
 432
 433 /** Returns floor(log2(u64)).  If u64 is 0, (incorrectly) returns 0. */
 434 int
 435 tor_log2(uint64_t u64)
 436 {
 437   int r = 0;
 438   if (u64 >= (U64_LITERAL(1)<<32)) {
 439     u64 >>= 32;
 440     r = 32;
 441   }
 442   if (u64 >= (U64_LITERAL(1)<<16)) {
 443     u64 >>= 16;
 444     r += 16;
 445   }
 446   if (u64 >= (U64_LITERAL(1)<<8)) {
 447     u64 >>= 8;
 448     r += 8;
 449   }
 450   if (u64 >= (U64_LITERAL(1)<<4)) {
 451     u64 >>= 4;
 452     r += 4;
 453   }
 454   if (u64 >= (U64_LITERAL(1)<<2)) {
 455     u64 >>= 2;
 456     r += 2;
 457   }
 458   if (u64 >= (U64_LITERAL(1)<<1)) {
 459     u64 >>= 1;
 460     r += 1;
 461   }
 462   return r;
 463 }
 464
 465 /** Return the power of 2 in range [1,UINT64_MAX] closest to <b>u64</b>.  If
 466  * there are two powers of 2 equally close, round down. */
 467 uint64_t
 468 round_to_power_of_2(uint64_t u64)
 469 {
 470   int lg2;
 471   uint64_t low;
 472   uint64_t high;
 473   if (u64 == 0)
 474     return 1;
 475
 476   lg2 = tor_log2(u64);
 477   low = U64_LITERAL(1) << lg2;
 478
 479   if (lg2 == 63)
 480     return low;
 481
 482   high = U64_LITERAL(1) << (lg2+1);
 483   if (high - u64 < u64 - low)
 484     return high;
 485   else
 486     return low;
 487 }
 488
 489 /** Return the lowest x such that x is at least <b>number</b>, and x modulo
 490  * <b>divisor</b> == 0. */
 491 unsigned
 492 round_to_next_multiple_of(unsigned number, unsigned divisor)
 493 {
 494   tor_assert(divisor > 0);
 495   if (UINT_MAX - divisor + 1 >= number)
 496     number += divisor - 1;
 497   number -= number % divisor;
 498   return number;
 499 }
 500
 501 /** Return the lowest x such that x is at least <b>number</b>, and x modulo
 502  * <b>divisor</b> == 0. */
 503 uint32_t
 504 round_uint32_to_next_multiple_of(uint32_t number, uint32_t divisor)
 505 {
 506   tor_assert(divisor > 0);
 507   if (UINT32_MAX - divisor + 1 >= number)
 508     number += divisor - 1;
 509   number -= number % divisor;
 510   return number;
 511 }
 512
 513 /** Return the lowest x such that x is at least <b>number</b>, and x modulo
 514  * <b>divisor</b> == 0. */
 515 uint64_t
 516 round_uint64_to_next_multiple_of(uint64_t number, uint64_t divisor)
 517 {
 518   tor_assert(divisor > 0);
 519   if (UINT64_MAX - divisor + 1 >= number)
 520     number += divisor - 1;
 521   number -= number % divisor;
 522   return number;
 523 }
 524
 525 /** Return the lowest x in [INT64_MIN, INT64_MAX] such that x is at least
 526  * <b>number</b>, and x modulo <b>divisor</b> == 0. */
 527 int64_t
 528 round_int64_to_next_multiple_of(int64_t number, int64_t divisor)
 529 {
 530   tor_assert(divisor > 0);
 531   if (number >= 0 && INT64_MAX - divisor + 1 >= number)
 532     number += divisor - 1;
 533   number -= number % divisor;
 534   return number;
 535 }
 536
 537 /** Transform a random value <b>p</b> from the uniform distribution in
 538  * [0.0, 1.0[ into a Laplace distributed value with location parameter
 539  * <b>mu</b> and scale parameter <b>b</b>. Truncate the final result
 540  * to be an integer in [INT64_MIN, INT64_MAX]. */
 541 int64_t
 542 sample_laplace_distribution(double mu, double b, double p)
 543 {
 544   double result;
 545   tor_assert(p >= 0.0 && p < 1.0);
 546
 547   /* This is the "inverse cumulative distribution function" from:
 548    * http://en.wikipedia.org/wiki/Laplace_distribution */
 549   if (p <= 0.0) {
 550     /* Avoid taking log(0.0) == -INFINITY, as some processors or compiler
 551      * options can cause the program to trap. */
 552     return INT64_MIN;
 553   }
 554
 555   result = mu - b * (p > 0.5 ? 1.0 : -1.0)
 556                   * tor_mathlog(1.0 - 2.0 * fabs(p - 0.5));
 557
 558   return cast_double_to_int64(result);
 559 }
 560
 561 /** Add random noise between INT64_MIN and INT64_MAX coming from a Laplace
 562  * distribution with mu = 0 and b = <b>delta_f</b>/<b>epsilon</b> to
 563  * <b>signal</b> based on the provided <b>random</b> value in [0.0, 1.0[.
 564  * The epsilon value must be between ]0.0, 1.0]. delta_f must be greater
 565  * than 0. */
 566 int64_t
 567 add_laplace_noise(int64_t signal, double random, double delta_f,
 568                   double epsilon)
 569 {
 570   int64_t noise;
 571
 572   /* epsilon MUST be between ]0.0, 1.0] */
 573   tor_assert(epsilon > 0.0 && epsilon <= 1.0);
 574   /* delta_f MUST be greater than 0. */
 575   tor_assert(delta_f > 0.0);
 576
 577   /* Just add noise, no further signal */
 578   noise = sample_laplace_distribution(0.0,
 579                                       delta_f / epsilon,
 580                                       random);
 581
 582   /* Clip (signal + noise) to [INT64_MIN, INT64_MAX] */
 583   if (noise > 0 && INT64_MAX - noise < signal)
 584     return INT64_MAX;
 585   else if (noise < 0 && INT64_MIN - noise > signal)
 586     return INT64_MIN;
 587   else
 588     return signal + noise;
 589 }
 590
 591 /** Return the number of bits set in <b>v</b>. */
 592 int
 593 n_bits_set_u8(uint8_t v)
 594 {
 595   static const int nybble_table[] = {
 596     0, /* 0000 */
 597     1, /* 0001 */
 598     1, /* 0010 */
 599     2, /* 0011 */
 600     1, /* 0100 */
 601     2, /* 0101 */
 602     2, /* 0110 */
 603     3, /* 0111 */
 604     1, /* 1000 */
 605     2, /* 1001 */
 606     2, /* 1010 */
 607     3, /* 1011 */
 608     2, /* 1100 */
 609     3, /* 1101 */
 610     3, /* 1110 */
 611     4, /* 1111 */
 612   };
 613
 614   return nybble_table[v & 15] + nybble_table[v>>4];
 615 }
 616
 617 /* =====
 618  * String manipulation
 619  * ===== */
 620
 621 /** Remove from the string <b>s</b> every character which appears in
 622  * <b>strip</b>. */
 623 void
 624 tor_strstrip(char *s, const char *strip)
 625 {
 626   char *read = s;
 627   while (*read) {
 628     if (strchr(strip, *read)) {
 629       ++read;
 630     } else {
 631       *s++ = *read++;
 632     }
 633   }
 634   *s = '\0';
 635 }
 636
 637 /** Return a pointer to a NUL-terminated hexadecimal string encoding
 638  * the first <b>fromlen</b> bytes of <b>from</b>. (fromlen must be \<= 32.) The
 639  * result does not need to be deallocated, but repeated calls to
 640  * hex_str will trash old results.
 641  */
 642 const char *
 643 hex_str(const char *from, size_t fromlen)
 644 {
 645   static char buf[65];
 646   if (fromlen>(sizeof(buf)-1)/2)
 647     fromlen = (sizeof(buf)-1)/2;
 648   base16_encode(buf,sizeof(buf),from,fromlen);
 649   return buf;
 650 }
 651
 652 /** Convert all alphabetic characters in the nul-terminated string <b>s</b> to
 653  * lowercase. */
 654 void
 655 tor_strlower(char *s)
 656 {
 657   while (*s) {
 658     *s = TOR_TOLOWER(*s);
 659     ++s;
 660   }
 661 }
 662
 663 /** Convert all alphabetic characters in the nul-terminated string <b>s</b> to
 664  * lowercase. */
 665 void
 666 tor_strupper(char *s)
 667 {
 668   while (*s) {
 669     *s = TOR_TOUPPER(*s);
 670     ++s;
 671   }
 672 }
 673
 674 /** Return 1 if every character in <b>s</b> is printable, else return 0.
 675  */
 676 int
 677 tor_strisprint(const char *s)
 678 {
 679   while (*s) {
 680     if (!TOR_ISPRINT(*s))
 681       return 0;
 682     s++;
 683   }
 684   return 1;
 685 }
 686
 687 /** Return 1 if no character in <b>s</b> is uppercase, else return 0.
 688  */
 689 int
 690 tor_strisnonupper(const char *s)
 691 {
 692   while (*s) {
 693     if (TOR_ISUPPER(*s))
 694       return 0;
 695     s++;
 696   }
 697   return 1;
 698 }
 699
 700 /** As strcmp, except that either string may be NULL.  The NULL string is
 701  * considered to be before any non-NULL string. */
 702 int
 703 strcmp_opt(const char *s1, const char *s2)
 704 {
 705   if (!s1) {
 706     if (!s2)
 707       return 0;
 708     else
 709       return -1;
 710   } else if (!s2) {
 711     return 1;
 712   } else {
 713     return strcmp(s1, s2);
 714   }
 715 }
 716
 717 /** Compares the first strlen(s2) characters of s1 with s2.  Returns as for
 718  * strcmp.
 719  */
 720 int
 721 strcmpstart(const char *s1, const char *s2)
 722 {
 723   size_t n = strlen(s2);
 724   return strncmp(s1, s2, n);
 725 }
 726
 727 /** Compare the s1_len-byte string <b>s1</b> with <b>s2</b>,
 728  * without depending on a terminating nul in s1.  Sorting order is first by
 729  * length, then lexically; return values are as for strcmp.
 730  */
 731 int
 732 strcmp_len(const char *s1, const char *s2, size_t s1_len)
 733 {
 734   size_t s2_len = strlen(s2);
 735   if (s1_len < s2_len)
 736     return -1;
 737   if (s1_len > s2_len)
 738     return 1;
 739   return fast_memcmp(s1, s2, s2_len);
 740 }
 741
 742 /** Compares the first strlen(s2) characters of s1 with s2.  Returns as for
 743  * strcasecmp.
 744  */
 745 int
 746 strcasecmpstart(const char *s1, const char *s2)
 747 {
 748   size_t n = strlen(s2);
 749   return strncasecmp(s1, s2, n);
 750 }
 751
 752 /** Compares the last strlen(s2) characters of s1 with s2.  Returns as for
 753  * strcmp.
 754  */
 755 int
 756 strcmpend(const char *s1, const char *s2)
 757 {
 758   size_t n1 = strlen(s1), n2 = strlen(s2);
 759   if (n2>n1)
 760     return strcmp(s1,s2);
 761   else
 762     return strncmp(s1+(n1-n2), s2, n2);
 763 }
 764
 765 /** Compares the last strlen(s2) characters of s1 with s2.  Returns as for
 766  * strcasecmp.
 767  */
 768 int
 769 strcasecmpend(const char *s1, const char *s2)
 770 {
 771   size_t n1 = strlen(s1), n2 = strlen(s2);
 772   if (n2>n1) /* then they can't be the same; figure out which is bigger */
 773     return strcasecmp(s1,s2);
 774   else
 775     return strncasecmp(s1+(n1-n2), s2, n2);
 776 }
 777
 778 /** Compare the value of the string <b>prefix</b> with the start of the
 779  * <b>memlen</b>-byte memory chunk at <b>mem</b>.  Return as for strcmp.
 780  *
 781  * [As fast_memcmp(mem, prefix, strlen(prefix)) but returns -1 if memlen is
 782  * less than strlen(prefix).]
 783  */
 784 int
 785 fast_memcmpstart(const void *mem, size_t memlen,
 786                 const char *prefix)
 787 {
 788   size_t plen = strlen(prefix);
 789   if (memlen < plen)
 790     return -1;
 791   return fast_memcmp(mem, prefix, plen);
 792 }
 793
 794 /** Return a pointer to the first char of s that is not whitespace and
 795  * not a comment, or to the terminating NUL if no such character exists.
 796  */
 797 const char *
 798 eat_whitespace(const char *s)
 799 {
 800   tor_assert(s);
 801
 802   while (1) {
 803     switch (*s) {
 804     case '\0':
 805     default:
 806       return s;
 807     case ' ':
 808     case '\t':
 809     case '\n':
 810     case '\r':
 811       ++s;
 812       break;
 813     case '#':
 814       ++s;
 815       while (*s && *s != '\n')
 816         ++s;
 817     }
 818   }
 819 }
 820
 821 /** Return a pointer to the first char of s that is not whitespace and
 822  * not a comment, or to the terminating NUL if no such character exists.
 823  */
 824 const char *
 825 eat_whitespace_eos(const char *s, const char *eos)
 826 {
 827   tor_assert(s);
 828   tor_assert(eos && s <= eos);
 829
 830   while (s < eos) {
 831     switch (*s) {
 832     case '\0':
 833     default:
 834       return s;
 835     case ' ':
 836     case '\t':
 837     case '\n':
 838     case '\r':
 839       ++s;
 840       break;
 841     case '#':
 842       ++s;
 843       while (s < eos && *s && *s != '\n')
 844         ++s;
 845     }
 846   }
 847   return s;
 848 }
 849
 850 /** Return a pointer to the first char of s that is not a space or a tab
 851  * or a \\r, or to the terminating NUL if no such character exists. */
 852 const char *
 853 eat_whitespace_no_nl(const char *s)
 854 {
 855   while (*s == ' ' || *s == '\t' || *s == '\r')
 856     ++s;
 857   return s;
 858 }
 859
 860 /** As eat_whitespace_no_nl, but stop at <b>eos</b> whether we have
 861  * found a non-whitespace character or not. */
 862 const char *
 863 eat_whitespace_eos_no_nl(const char *s, const char *eos)
 864 {
 865   while (s < eos && (*s == ' ' || *s == '\t' || *s == '\r'))
 866     ++s;
 867   return s;
 868 }
 869
 870 /** Return a pointer to the first char of s that is whitespace or <b>#</b>,
 871  * or to the terminating NUL if no such character exists.
 872  */
 873 const char *
 874 find_whitespace(const char *s)
 875 {
 876   /* tor_assert(s); */
 877   while (1) {
 878     switch (*s)
 879     {
 880     case '\0':
 881     case '#':
 882     case ' ':
 883     case '\r':
 884     case '\n':
 885     case '\t':
 886       return s;
 887     default:
 888       ++s;
 889     }
 890   }
 891 }
 892
 893 /** As find_whitespace, but stop at <b>eos</b> whether we have found a
 894  * whitespace or not. */
 895 const char *
 896 find_whitespace_eos(const char *s, const char *eos)
 897 {
 898   /* tor_assert(s); */
 899   while (s < eos) {
 900     switch (*s)
 901     {
 902     case '\0':
 903     case '#':
 904     case ' ':
 905     case '\r':
 906     case '\n':
 907     case '\t':
 908       return s;
 909     default:
 910       ++s;
 911     }
 912   }
 913   return s;
 914 }
 915
 916 /** Return the first occurrence of <b>needle</b> in <b>haystack</b> that
 917  * occurs at the start of a line (that is, at the beginning of <b>haystack</b>
 918  * or immediately after a newline).  Return NULL if no such string is found.
 919  */
 920 const char *
 921 find_str_at_start_of_line(const char *haystack, const char *needle)
 922 {
 923   size_t needle_len = strlen(needle);
 924
 925   do {
 926     if (!strncmp(haystack, needle, needle_len))
 927       return haystack;
 928
 929     haystack = strchr(haystack, '\n');
 930     if (!haystack)
 931       return NULL;
 932     else
 933       ++haystack;
 934   } while (*haystack);
 935
 936   return NULL;
 937 }
 938
 939 /** Returns true if <b>string</b> could be a C identifier.
 940     A C identifier must begin with a letter or an underscore and the
 941     rest of its characters can be letters, numbers or underscores. No
 942     length limit is imposed. */
 943 int
 944 string_is_C_identifier(const char *string)
 945 {
 946   size_t iter;
 947   size_t length = strlen(string);
 948   if (!length)
 949     return 0;
 950
 951   for (iter = 0; iter < length ; iter++) {
 952     if (iter == 0) {
 953       if (!(TOR_ISALPHA(string[iter]) ||
 954             string[iter] == '_'))
 955         return 0;
 956     } else {
 957       if (!(TOR_ISALPHA(string[iter]) ||
 958             TOR_ISDIGIT(string[iter]) ||
 959             string[iter] == '_'))
 960         return 0;
 961     }
 962   }
 963
 964   return 1;
 965 }
 966
 967 /** Return true iff the 'len' bytes at 'mem' are all zero. */
 968 int
 969 tor_mem_is_zero(const char *mem, size_t len)
 970 {
 971   static const char ZERO[] = {
 972     0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0,
 973   };
 974   while (len >= sizeof(ZERO)) {
 975     /* It's safe to use fast_memcmp here, since the very worst thing an
 976      * attacker could learn is how many initial bytes of a secret were zero */
 977     if (fast_memcmp(mem, ZERO, sizeof(ZERO)))
 978       return 0;
 979     len -= sizeof(ZERO);
 980     mem += sizeof(ZERO);
 981   }
 982   /* Deal with leftover bytes. */
 983   if (len)
 984     return fast_memeq(mem, ZERO, len);
 985
 986   return 1;
 987 }
 988
 989 /** Return true iff the DIGEST_LEN bytes in digest are all zero. */
 990 int
 991 tor_digest_is_zero(const char *digest)
 992 {
 993   static const uint8_t ZERO_DIGEST[] = {
 994     0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0, 0,0,0,0
 995   };
 996   return tor_memeq(digest, ZERO_DIGEST, DIGEST_LEN);
 997 }
 998
 999 /** Return true if <b>string</b> is a valid 'key=[value]' string.
1000  *  "value" is optional, to indicate the empty string. Log at logging
1001  *  <b>severity</b> if something ugly happens. */
1002 int
1003 string_is_key_value(int severity, const char *string)
1004 {
1005   /* position of equal sign in string */
1006   const char *equal_sign_pos = NULL;
1007
1008   tor_assert(string);
1009
1010   if (strlen(string) < 2) { /* "x=" is shortest args string */
1011     tor_log(severity, LD_GENERAL, "'%s' is too short to be a k=v value.",
1012             escaped(string));
1013     return 0;
1014   }
1015
1016   equal_sign_pos = strchr(string, '=');
1017   if (!equal_sign_pos) {
1018     tor_log(severity, LD_GENERAL, "'%s' is not a k=v value.", escaped(string));
1019     return 0;
1020   }
1021
1022   /* validate that the '=' is not in the beginning of the string. */
1023   if (equal_sign_pos == string) {
1024     tor_log(severity, LD_GENERAL, "'%s' is not a valid k=v value.",
1025             escaped(string));
1026     return 0;
1027   }
1028
1029   return 1;
1030 }
1031
1032 /** Return true if <b>string</b> represents a valid IPv4 adddress in
1033  * 'a.b.c.d' form.
1034  */
1035 int
1036 string_is_valid_ipv4_address(const char *string)
1037 {
1038   struct in_addr addr;
1039
1040   return (tor_inet_pton(AF_INET,string,&addr) == 1);
1041 }
1042
1043 /** Return true if <b>string</b> represents a valid IPv6 address in
1044  * a form that inet_pton() can parse.
1045  */
1046 int
1047 string_is_valid_ipv6_address(const char *string)
1048 {
1049   struct in6_addr addr;
1050
1051   return (tor_inet_pton(AF_INET6,string,&addr) == 1);
1052 }
1053
1054 /** Return true iff <b>string</b> matches a pattern of DNS names
1055  * that we allow Tor clients to connect to.
1056  */
1057 int
1058 string_is_valid_hostname(const char *string)
1059 {
1060   int result = 1;
1061   smartlist_t *components;
1062
1063   components = smartlist_new();
1064
1065   smartlist_split_string(components,string,".",0,0);
1066
1067   SMARTLIST_FOREACH_BEGIN(components, char *, c) {
1068     if (c[0] == '-') {
1069       result = 0;
1070       break;
1071     }
1072
1073     do {
1074       if ((*c >= 'a' && *c <= 'z') ||
1075           (*c >= 'A' && *c <= 'Z') ||
1076           (*c >= '0' && *c <= '9') ||
1077           (*c == '-'))
1078         c++;
1079       else
1080         result = 0;
1081     } while (result && *c);
1082
1083   } SMARTLIST_FOREACH_END(c);
1084
1085   SMARTLIST_FOREACH_BEGIN(components, char *, c) {
1086     tor_free(c);
1087   } SMARTLIST_FOREACH_END(c);
1088
1089   smartlist_free(components);
1090
1091   return result;
1092 }
1093
1094 /** Return true iff the DIGEST256_LEN bytes in digest are all zero. */
1095 int
1096 tor_digest256_is_zero(const char *digest)
1097 {
1098   return tor_mem_is_zero(digest, DIGEST256_LEN);
1099 }
1100
1101 /* Helper: common code to check whether the result of a strtol or strtoul or
1102  * strtoll is correct. */
1103 #define CHECK_STRTOX_RESULT()                           \
1104   /* Did an overflow occur? */                          \
1105   if (errno == ERANGE)                                  \
1106     goto err;                                           \
1107   /* Was at least one character converted? */           \
1108   if (endptr == s)                                      \
1109     goto err;                                           \
1110   /* Were there unexpected unconverted characters? */   \
1111   if (!next && *endptr)                                 \
1112     goto err;                                           \
1113   /* Is r within limits? */                             \
1114   if (r < min || r > max)                               \
1115     goto err;                                           \
1116   if (ok) *ok = 1;                                      \
1117   if (next) *next = endptr;                             \
1118   return r;                                             \
1119  err:                                                   \
1120   if (ok) *ok = 0;                                      \
1121   if (next) *next = endptr;                             \
1122   return 0
1123
1124 /** Extract a long from the start of <b>s</b>, in the given numeric
1125  * <b>base</b>.  If <b>base</b> is 0, <b>s</b> is parsed as a decimal,
1126  * octal, or hex number in the syntax of a C integer literal.  If
1127  * there is unconverted data and <b>next</b> is provided, set
1128  * *<b>next</b> to the first unconverted character.  An error has
1129  * occurred if no characters are converted; or if there are
1130  * unconverted characters and <b>next</b> is NULL; or if the parsed
1131  * value is not between <b>min</b> and <b>max</b>.  When no error
1132  * occurs, return the parsed value and set *<b>ok</b> (if provided) to
1133  * 1.  When an error occurs, return 0 and set *<b>ok</b> (if provided)
1134  * to 0.
1135  */
1136 long
1137 tor_parse_long(const char *s, int base, long min, long max,
1138                int *ok, char **next)
1139 {
1140   char *endptr;
1141   long r;
1142
1143   if (base < 0) {
1144     if (ok)
1145       *ok = 0;
1146     return 0;
1147   }
1148
1149   errno = 0;
1150   r = strtol(s, &endptr, base);
1151   CHECK_STRTOX_RESULT();
1152 }
1153
1154 /** As tor_parse_long(), but return an unsigned long. */
1155 unsigned long
1156 tor_parse_ulong(const char *s, int base, unsigned long min,
1157                 unsigned long max, int *ok, char **next)
1158 {
1159   char *endptr;
1160   unsigned long r;
1161
1162   if (base < 0) {
1163     if (ok)
1164       *ok = 0;
1165     return 0;
1166   }
1167
1168   errno = 0;
1169   r = strtoul(s, &endptr, base);
1170   CHECK_STRTOX_RESULT();
1171 }
1172
1173 /** As tor_parse_long(), but return a double. */
1174 double
1175 tor_parse_double(const char *s, double min, double max, int *ok, char **next)
1176 {
1177   char *endptr;
1178   double r;
1179
1180   errno = 0;
1181   r = strtod(s, &endptr);
1182   CHECK_STRTOX_RESULT();
1183 }
1184
1185 /** As tor_parse_long, but return a uint64_t.  Only base 10 is guaranteed to
1186  * work for now. */
1187 uint64_t
1188 tor_parse_uint64(const char *s, int base, uint64_t min,
1189                  uint64_t max, int *ok, char **next)
1190 {
1191   char *endptr;
1192   uint64_t r;
1193
1194   if (base < 0) {
1195     if (ok)
1196       *ok = 0;
1197     return 0;
1198   }
1199
1200   errno = 0;
1201 #ifdef HAVE_STRTOULL
1202   r = (uint64_t)strtoull(s, &endptr, base);
1203 #elif defined(_WIN32)
1204 #if defined(_MSC_VER) && _MSC_VER < 1300
1205   tor_assert(base <= 10);
1206   r = (uint64_t)_atoi64(s);
1207   endptr = (char*)s;
1208   while (TOR_ISSPACE(*endptr)) endptr++;
1209   while (TOR_ISDIGIT(*endptr)) endptr++;
1210 #else
1211   r = (uint64_t)_strtoui64(s, &endptr, base);
1212 #endif
1213 #elif SIZEOF_LONG == 8
1214   r = (uint64_t)strtoul(s, &endptr, base);
1215 #else
1216 #error "I don't know how to parse 64-bit numbers."
1217 #endif
1218
1219   CHECK_STRTOX_RESULT();
1220 }
1221
1222 /** Encode the <b>srclen</b> bytes at <b>src</b> in a NUL-terminated,
1223  * uppercase hexadecimal string; store it in the <b>destlen</b>-byte buffer
1224  * <b>dest</b>.
1225  */
1226 void
1227 base16_encode(char *dest, size_t destlen, const char *src, size_t srclen)
1228 {
1229   const char *end;
1230   char *cp;
1231
1232   tor_assert(destlen >= srclen*2+1);
1233   tor_assert(destlen < SIZE_T_CEILING);
1234
1235   cp = dest;
1236   end = src+srclen;
1237   while (src<end) {
1238     *cp++ = "0123456789ABCDEF"[ (*(const uint8_t*)src) >> 4 ];
1239     *cp++ = "0123456789ABCDEF"[ (*(const uint8_t*)src) & 0xf ];
1240     ++src;
1241   }
1242   *cp = '\0';
1243 }
1244
1245 /** Helper: given a hex digit, return its value, or -1 if it isn't hex. */
1246 static INLINE int
1247 hex_decode_digit_(char c)
1248 {
1249   switch (c) {
1250     case '0': return 0;
1251     case '1': return 1;
1252     case '2': return 2;
1253     case '3': return 3;
1254     case '4': return 4;
1255     case '5': return 5;
1256     case '6': return 6;
1257     case '7': return 7;
1258     case '8': return 8;
1259     case '9': return 9;
1260     case 'A': case 'a': return 10;
1261     case 'B': case 'b': return 11;
1262     case 'C': case 'c': return 12;
1263     case 'D': case 'd': return 13;
1264     case 'E': case 'e': return 14;
1265     case 'F': case 'f': return 15;
1266     default:
1267       return -1;
1268   }
1269 }
1270
1271 /** Helper: given a hex digit, return its value, or -1 if it isn't hex. */
1272 int
1273 hex_decode_digit(char c)
1274 {
1275   return hex_decode_digit_(c);
1276 }
1277
1278 /** Given a hexadecimal string of <b>srclen</b> bytes in <b>src</b>, decode it
1279  * and store the result in the <b>destlen</b>-byte buffer at <b>dest</b>.
1280  * Return 0 on success, -1 on failure. */
1281 int
1282 base16_decode(char *dest, size_t destlen, const char *src, size_t srclen)
1283 {
1284   const char *end;
1285
1286   int v1,v2;
1287   if ((srclen % 2) != 0)
1288     return -1;
1289   if (destlen < srclen/2 || destlen > SIZE_T_CEILING)
1290     return -1;
1291
1292   memset(dest, 0, destlen);
1293
1294   end = src+srclen;
1295   while (src<end) {
1296     v1 = hex_decode_digit_(*src);
1297     v2 = hex_decode_digit_(*(src+1));
1298     if (v1<0||v2<0)
1299       return -1;
1300     *(uint8_t*)dest = (v1<<4)|v2;
1301     ++dest;
1302     src+=2;
1303   }
1304   return 0;
1305 }
1306
1307 /** Allocate and return a new string representing the contents of <b>s</b>,
1308  * surrounded by quotes and using standard C escapes.
1309  *
1310  * Generally, we use this for logging values that come in over the network to
1311  * keep them from tricking users, and for sending certain values to the
1312  * controller.
1313  *
1314  * We trust values from the resolver, OS, configuration file, and command line
1315  * to not be maliciously ill-formed.  We validate incoming routerdescs and
1316  * SOCKS requests and addresses from BEGIN cells as they're parsed;
1317  * afterwards, we trust them as non-malicious.
1318  */
1319 char *
1320 esc_for_log(const char *s)
1321 {
1322   const char *cp;
1323   char *result, *outp;
1324   size_t len = 3;
1325   if (!s) {
1326     return tor_strdup("(null)");
1327   }
1328
1329   for (cp = s; *cp; ++cp) {
1330     switch (*cp) {
1331       case '\\':
1332       case '\"':
1333       case '\'':
1334       case '\r':
1335       case '\n':
1336       case '\t':
1337         len += 2;
1338         break;
1339       default:
1340         if (TOR_ISPRINT(*cp) && ((uint8_t)*cp)<127)
1341           ++len;
1342         else
1343           len += 4;
1344         break;
1345     }
1346   }
1347
1348   tor_assert(len <= SSIZE_MAX);
1349
1350   result = outp = tor_malloc(len);
1351   *outp++ = '\"';
1352   for (cp = s; *cp; ++cp) {
1353     /* This assertion should always succeed, since we will write at least
1354      * one char here, and two chars for closing quote and nul later */
1355     tor_assert((outp-result) < (ssize_t)len-2);
1356     switch (*cp) {
1357       case '\\':
1358       case '\"':
1359       case '\'':
1360         *outp++ = '\\';
1361         *outp++ = *cp;
1362         break;
1363       case '\n':
1364         *outp++ = '\\';
1365         *outp++ = 'n';
1366         break;
1367       case '\t':
1368         *outp++ = '\\';
1369         *outp++ = 't';
1370         break;
1371       case '\r':
1372         *outp++ = '\\';
1373         *outp++ = 'r';
1374         break;
1375       default:
1376         if (TOR_ISPRINT(*cp) && ((uint8_t)*cp)<127) {
1377           *outp++ = *cp;
1378         } else {
1379           tor_assert((outp-result) < (ssize_t)len-4);
1380           tor_snprintf(outp, 5, "\\%03o", (int)(uint8_t) *cp);
1381           outp += 4;
1382         }
1383         break;
1384     }
1385   }
1386
1387   tor_assert((outp-result) <= (ssize_t)len-2);
1388   *outp++ = '\"';
1389   *outp++ = 0;
1390
1391   return result;
1392 }
1393
1394 /** Similar to esc_for_log. Allocate and return a new string representing
1395  * the first n characters in <b>chars</b>, surround by quotes and using
1396  * standard C escapes. If a NUL character is encountered in <b>chars</b>,
1397  * the resulting string will be terminated there.
1398  */
1399 char *
1400 esc_for_log_len(const char *chars, size_t n)
1401 {
1402   char *string = tor_strndup(chars, n);
1403   char *string_escaped = esc_for_log(string);
1404   tor_free(string);
1405   return string_escaped;
1406 }
1407
1408 /** Allocate and return a new string representing the contents of <b>s</b>,
1409  * surrounded by quotes and using standard C escapes.
1410  *
1411  * THIS FUNCTION IS NOT REENTRANT.  Don't call it from outside the main
1412  * thread.  Also, each call invalidates the last-returned value, so don't
1413  * try log_warn(LD_GENERAL, "%s %s", escaped(a), escaped(b));
1414  */
1415 const char *
1416 escaped(const char *s)
1417 {
1418   static char *escaped_val_ = NULL;
1419   tor_free(escaped_val_);
1420
1421   if (s)
1422     escaped_val_ = esc_for_log(s);
1423   else
1424     escaped_val_ = NULL;
1425
1426   return escaped_val_;
1427 }
1428
1429 /** Return a newly allocated string equal to <b>string</b>, except that every
1430  * character in <b>chars_to_escape</b> is preceded by a backslash. */
1431 char *
1432 tor_escape_str_for_pt_args(const char *string, const char *chars_to_escape)
1433 {
1434   char *new_string = NULL;
1435   char *new_cp = NULL;
1436   size_t length, new_length;
1437
1438   tor_assert(string);
1439
1440   length = strlen(string);
1441
1442   if (!length) /* If we were given the empty string, return the same. */
1443     return tor_strdup("");
1444   /* (new_length > SIZE_MAX) => ((length * 2) + 1 > SIZE_MAX) =>
1445      (length*2 > SIZE_MAX - 1) => (length > (SIZE_MAX - 1)/2) */
1446   if (length > (SIZE_MAX - 1)/2) /* check for overflow */
1447     return NULL;
1448
1449   /* this should be enough even if all characters must be escaped */
1450   new_length = (length * 2) + 1;
1451
1452   new_string = new_cp = tor_malloc(new_length);
1453
1454   while (*string) {
1455     if (strchr(chars_to_escape, *string))
1456       *new_cp++ = '\\';
1457
1458     *new_cp++ = *string++;
1459   }
1460
1461   *new_cp = '\0'; /* NUL-terminate the new string */
1462
1463   return new_string;
1464 }
1465
1466 /* =====
1467  * Time
1468  * ===== */
1469
1470 /** Return the number of microseconds elapsed between *start and *end.
1471  */
1472 long
1473 tv_udiff(const struct timeval *start, const struct timeval *end)
1474 {
1475   long udiff;
1476   long secdiff = end->tv_sec - start->tv_sec;
1477
1478   if (labs(secdiff+1) > LONG_MAX/1000000) {
1479     log_warn(LD_GENERAL, "comparing times on microsecond detail too far "
1480              "apart: %ld seconds", secdiff);
1481     return LONG_MAX;
1482   }
1483
1484   udiff = secdiff*1000000L + (end->tv_usec - start->tv_usec);
1485   return udiff;
1486 }
1487
1488 /** Return the number of milliseconds elapsed between *start and *end.
1489  */
1490 long
1491 tv_mdiff(const struct timeval *start, const struct timeval *end)
1492 {
1493   long mdiff;
1494   long secdiff = end->tv_sec - start->tv_sec;
1495
1496   if (labs(secdiff+1) > LONG_MAX/1000) {
1497     log_warn(LD_GENERAL, "comparing times on millisecond detail too far "
1498              "apart: %ld seconds", secdiff);
1499     return LONG_MAX;
1500   }
1501
1502   /* Subtract and round */
1503   mdiff = secdiff*1000L +
1504       ((long)end->tv_usec - (long)start->tv_usec + 500L) / 1000L;
1505   return mdiff;
1506 }
1507
1508 /**
1509  * Converts timeval to milliseconds.
1510  */
1511 int64_t
1512 tv_to_msec(const struct timeval *tv)
1513 {
1514   int64_t conv = ((int64_t)tv->tv_sec)*1000L;
1515   /* Round ghetto-style */
1516   conv += ((int64_t)tv->tv_usec+500)/1000L;
1517   return conv;
1518 }
1519
1520 /** Yield true iff <b>y</b> is a leap-year. */
1521 #define IS_LEAPYEAR(y) (!(y % 4) && ((y % 100) || !(y % 400)))
1522 /** Helper: Return the number of leap-days between Jan 1, y1 and Jan 1, y2. */
1523 static int
1524 n_leapdays(int y1, int y2)
1525 {
1526   --y1;
1527   --y2;
1528   return (y2/4 - y1/4) - (y2/100 - y1/100) + (y2/400 - y1/400);
1529 }
1530 /** Number of days per month in non-leap year; used by tor_timegm and
1531  * parse_rfc1123_time. */
1532 static const int days_per_month[] =
1533   { 31, 28, 31, 30, 31, 30, 31, 31, 30, 31, 30, 31};
1534
1535 /** Compute a time_t given a struct tm.  The result is given in UTC, and
1536  * does not account for leap seconds.  Return 0 on success, -1 on failure.
1537  */
1538 int
1539 tor_timegm(const struct tm *tm, time_t *time_out)
1540 {
1541   /* This is a pretty ironclad timegm implementation, snarfed from Python2.2.
1542    * It's way more brute-force than fiddling with tzset().
1543    */
1544   time_t year, days, hours, minutes, seconds;
1545   int i, invalid_year, dpm;
1546   /* avoid int overflow on addition */
1547   if (tm->tm_year < INT32_MAX-1900) {
1548     year = tm->tm_year + 1900;
1549   } else {
1550     /* clamp year */
1551     year = INT32_MAX;
1552   }
1553   invalid_year = (year < 1970 || tm->tm_year >= INT32_MAX-1900);
1554
1555   if (tm->tm_mon >= 0 && tm->tm_mon <= 11) {
1556     dpm = days_per_month[tm->tm_mon];
1557     if (tm->tm_mon == 1 && !invalid_year && IS_LEAPYEAR(tm->tm_year)) {
1558       dpm = 29;
1559     }
1560   } else {
1561     /* invalid month - default to 0 days per month */
1562     dpm = 0;
1563   }
1564
1565   if (invalid_year ||
1566       tm->tm_mon < 0 || tm->tm_mon > 11 ||
1567       tm->tm_mday < 1 || tm->tm_mday > dpm ||
1568       tm->tm_hour < 0 || tm->tm_hour > 23 ||
1569       tm->tm_min < 0 || tm->tm_min > 59 ||
1570       tm->tm_sec < 0 || tm->tm_sec > 60) {
1571     log_warn(LD_BUG, "Out-of-range argument to tor_timegm");
1572     return -1;
1573   }
1574   days = 365 * (year-1970) + n_leapdays(1970,(int)year);
1575   for (i = 0; i < tm->tm_mon; ++i)
1576     days += days_per_month[i];
1577   if (tm->tm_mon > 1 && IS_LEAPYEAR(year))
1578     ++days;
1579   days += tm->tm_mday - 1;
1580   hours = days*24 + tm->tm_hour;
1581
1582   minutes = hours*60 + tm->tm_min;
1583   seconds = minutes*60 + tm->tm_sec;
1584   *time_out = seconds;
1585   return 0;
1586 }
1587
1588 /* strftime is locale-specific, so we need to replace those parts */
1589
1590 /** A c-locale array of 3-letter names of weekdays, starting with Sun. */
1591 static const char *WEEKDAY_NAMES[] =
1592   { "Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat" };
1593 /** A c-locale array of 3-letter names of months, starting with Jan. */
1594 static const char *MONTH_NAMES[] =
1595   { "Jan", "Feb", "Mar", "Apr", "May", "Jun",
1596     "Jul", "Aug", "Sep", "Oct", "Nov", "Dec" };
1597
1598 /** Set <b>buf</b> to the RFC1123 encoding of the UTC value of <b>t</b>.
1599  * The buffer must be at least RFC1123_TIME_LEN+1 bytes long.
1600  *
1601  * (RFC1123 format is "Fri, 29 Sep 2006 15:54:20 GMT". Note the "GMT"
1602  * rather than "UTC".)
1603  */
1604 void
1605 format_rfc1123_time(char *buf, time_t t)
1606 {
1607   struct tm tm;
1608
1609   tor_gmtime_r(&t, &tm);
1610
1611   strftime(buf, RFC1123_TIME_LEN+1, "___, %d ___ %Y %H:%M:%S GMT", &tm);
1612   tor_assert(tm.tm_wday >= 0);
1613   tor_assert(tm.tm_wday <= 6);
1614   memcpy(buf, WEEKDAY_NAMES[tm.tm_wday], 3);
1615   tor_assert(tm.tm_mon >= 0);
1616   tor_assert(tm.tm_mon <= 11);
1617   memcpy(buf+8, MONTH_NAMES[tm.tm_mon], 3);
1618 }
1619
1620 /** Parse the (a subset of) the RFC1123 encoding of some time (in UTC) from
1621  * <b>buf</b>, and store the result in *<b>t</b>.
1622  *
1623  * Note that we only accept the subset generated by format_rfc1123_time above,
1624  * not the full range of formats suggested by RFC 1123.
1625  *
1626  * Return 0 on success, -1 on failure.
1627 */
1628 int
1629 parse_rfc1123_time(const char *buf, time_t *t)
1630 {
1631   struct tm tm;
1632   char month[4];
1633   char weekday[4];
1634   int i, m, invalid_year;
1635   unsigned tm_mday, tm_year, tm_hour, tm_min, tm_sec;
1636   unsigned dpm;
1637
1638   if (strlen(buf) != RFC1123_TIME_LEN)
1639     return -1;
1640   memset(&tm, 0, sizeof(tm));
1641   if (tor_sscanf(buf, "%3s, %2u %3s %u %2u:%2u:%2u GMT", weekday,
1642              &tm_mday, month, &tm_year, &tm_hour,
1643              &tm_min, &tm_sec) < 7) {
1644     char *esc = esc_for_log(buf);
1645     log_warn(LD_GENERAL, "Got invalid RFC1123 time %s", esc);
1646     tor_free(esc);
1647     return -1;
1648   }
1649
1650   m = -1;
1651   for (i = 0; i < 12; ++i) {
1652     if (!strcmp(month, MONTH_NAMES[i])) {
1653       m = i;
1654       break;
1655     }
1656   }
1657   if (m<0) {
1658     char *esc = esc_for_log(buf);
1659     log_warn(LD_GENERAL, "Got invalid RFC1123 time %s: No such month", esc);
1660     tor_free(esc);
1661     return -1;
1662   }
1663   tm.tm_mon = m;
1664
1665   invalid_year = (tm_year >= INT32_MAX || tm_year < 1970);
1666   tor_assert(m >= 0 && m <= 11);
1667   dpm = days_per_month[m];
1668   if (m == 1 && !invalid_year && IS_LEAPYEAR(tm_year)) {
1669     dpm = 29;
1670   }
1671
1672   if (invalid_year || tm_mday < 1 || tm_mday > dpm ||
1673       tm_hour > 23 || tm_min > 59 || tm_sec > 60) {
1674     char *esc = esc_for_log(buf);
1675     log_warn(LD_GENERAL, "Got invalid RFC1123 time %s", esc);
1676     tor_free(esc);
1677     return -1;
1678   }
1679   tm.tm_mday = (int)tm_mday;
1680   tm.tm_year = (int)tm_year;
1681   tm.tm_hour = (int)tm_hour;
1682   tm.tm_min = (int)tm_min;
1683   tm.tm_sec = (int)tm_sec;
1684
1685   if (tm.tm_year < 1970) {
1686     char *esc = esc_for_log(buf);
1687     log_warn(LD_GENERAL,
1688              "Got invalid RFC1123 time %s. (Before 1970)", esc);
1689     tor_free(esc);
1690     return -1;
1691   }
1692   tm.tm_year -= 1900;
1693
1694   return tor_timegm(&tm, t);
1695 }
1696
1697 /** Set <b>buf</b> to the ISO8601 encoding of the local value of <b>t</b>.
1698  * The buffer must be at least ISO_TIME_LEN+1 bytes long.
1699  *
1700  * (ISO8601 format is 2006-10-29 10:57:20)
1701  */
1702 void
1703 format_local_iso_time(char *buf, time_t t)
1704 {
1705   struct tm tm;
1706   strftime(buf, ISO_TIME_LEN+1, "%Y-%m-%d %H:%M:%S", tor_localtime_r(&t, &tm));
1707 }
1708
1709 /** Set <b>buf</b> to the ISO8601 encoding of the GMT value of <b>t</b>.
1710  * The buffer must be at least ISO_TIME_LEN+1 bytes long.
1711  */
1712 void
1713 format_iso_time(char *buf, time_t t)
1714 {
1715   struct tm tm;
1716   strftime(buf, ISO_TIME_LEN+1, "%Y-%m-%d %H:%M:%S", tor_gmtime_r(&t, &tm));
1717 }
1718
1719 /** As format_iso_time, but use the yyyy-mm-ddThh:mm:ss format to avoid
1720  * embedding an internal space. */
1721 void
1722 format_iso_time_nospace(char *buf, time_t t)
1723 {
1724   format_iso_time(buf, t);
1725   buf[10] = 'T';
1726 }
1727
1728 /** As format_iso_time_nospace, but include microseconds in decimal
1729  * fixed-point format.  Requires that buf be at least ISO_TIME_USEC_LEN+1
1730  * bytes long. */
1731 void
1732 format_iso_time_nospace_usec(char *buf, const struct timeval *tv)
1733 {
1734   tor_assert(tv);
1735   format_iso_time_nospace(buf, (time_t)tv->tv_sec);
1736   tor_snprintf(buf+ISO_TIME_LEN, 8, ".%06d", (int)tv->tv_usec);
1737 }
1738
1739 /** Given an ISO-formatted UTC time value (after the epoch) in <b>cp</b>,
1740  * parse it and store its value in *<b>t</b>.  Return 0 on success, -1 on
1741  * failure.  Ignore extraneous stuff in <b>cp</b> after the end of the time
1742  * string, unless <b>strict</b> is set. */
1743 int
1744 parse_iso_time_(const char *cp, time_t *t, int strict)
1745 {
1746   struct tm st_tm;
1747   unsigned int year=0, month=0, day=0, hour=0, minute=0, second=0;
1748   int n_fields;
1749   char extra_char;
1750   n_fields = tor_sscanf(cp, "%u-%2u-%2u %2u:%2u:%2u%c", &year, &month,
1751                         &day, &hour, &minute, &second, &extra_char);
1752   if (strict ? (n_fields != 6) : (n_fields < 6)) {
1753     char *esc = esc_for_log(cp);
1754     log_warn(LD_GENERAL, "ISO time %s was unparseable", esc);
1755     tor_free(esc);
1756     return -1;
1757   }
1758   if (year < 1970 || month < 1 || month > 12 || day < 1 || day > 31 ||
1759           hour > 23 || minute > 59 || second > 60 || year >= INT32_MAX) {
1760     char *esc = esc_for_log(cp);
1761     log_warn(LD_GENERAL, "ISO time %s was nonsensical", esc);
1762     tor_free(esc);
1763     return -1;
1764   }
1765   st_tm.tm_year = (int)year-1900;
1766   st_tm.tm_mon = month-1;
1767   st_tm.tm_mday = day;
1768   st_tm.tm_hour = hour;
1769   st_tm.tm_min = minute;
1770   st_tm.tm_sec = second;
1771
1772   if (st_tm.tm_year < 70) {
1773     char *esc = esc_for_log(cp);
1774     log_warn(LD_GENERAL, "Got invalid ISO time %s. (Before 1970)", esc);
1775     tor_free(esc);
1776     return -1;
1777   }
1778   return tor_timegm(&st_tm, t);
1779 }
1780
1781 /** Given an ISO-formatted UTC time value (after the epoch) in <b>cp</b>,
1782  * parse it and store its value in *<b>t</b>.  Return 0 on success, -1 on
1783  * failure. Reject the string if any characters are present after the time.
1784  */
1785 int
1786 parse_iso_time(const char *cp, time_t *t)
1787 {
1788   return parse_iso_time_(cp, t, 1);
1789 }
1790
1791 /** Given a <b>date</b> in one of the three formats allowed by HTTP (ugh),
1792  * parse it into <b>tm</b>.  Return 0 on success, negative on failure. */
1793 int
1794 parse_http_time(const char *date, struct tm *tm)
1795 {
1796   const char *cp;
1797   char month[4];
1798   char wkday[4];
1799   int i;
1800   unsigned tm_mday, tm_year, tm_hour, tm_min, tm_sec;
1801
1802   tor_assert(tm);
1803   memset(tm, 0, sizeof(*tm));
1804
1805   /* First, try RFC1123 or RFC850 format: skip the weekday.  */
1806   if ((cp = strchr(date, ','))) {
1807     ++cp;
1808     if (*cp != ' ')
1809       return -1;
1810     ++cp;
1811     if (tor_sscanf(cp, "%2u %3s %4u %2u:%2u:%2u GMT",
1812                &tm_mday, month, &tm_year,
1813                &tm_hour, &tm_min, &tm_sec) == 6) {
1814       /* rfc1123-date */
1815       tm_year -= 1900;
1816     } else if (tor_sscanf(cp, "%2u-%3s-%2u %2u:%2u:%2u GMT",
1817                       &tm_mday, month, &tm_year,
1818                       &tm_hour, &tm_min, &tm_sec) == 6) {
1819       /* rfc850-date */
1820     } else {
1821       return -1;
1822     }
1823   } else {
1824     /* No comma; possibly asctime() format. */
1825     if (tor_sscanf(date, "%3s %3s %2u %2u:%2u:%2u %4u",
1826                wkday, month, &tm_mday,
1827                &tm_hour, &tm_min, &tm_sec, &tm_year) == 7) {
1828       tm_year -= 1900;
1829     } else {
1830       return -1;
1831     }
1832   }
1833   tm->tm_mday = (int)tm_mday;
1834   tm->tm_year = (int)tm_year;
1835   tm->tm_hour = (int)tm_hour;
1836   tm->tm_min = (int)tm_min;
1837   tm->tm_sec = (int)tm_sec;
1838
1839   month[3] = '\0';
1840   /* Okay, now decode the month. */
1841   /* set tm->tm_mon to dummy value so the check below fails. */
1842   tm->tm_mon = -1;
1843   for (i = 0; i < 12; ++i) {
1844     if (!strcasecmp(MONTH_NAMES[i], month)) {
1845       tm->tm_mon = i;
1846     }
1847   }
1848
1849   if (tm->tm_year < 0 ||
1850       tm->tm_mon < 0  || tm->tm_mon > 11 ||
1851       tm->tm_mday < 1 || tm->tm_mday > 31 ||
1852       tm->tm_hour < 0 || tm->tm_hour > 23 ||
1853       tm->tm_min < 0  || tm->tm_min > 59 ||
1854       tm->tm_sec < 0  || tm->tm_sec > 60)
1855     return -1; /* Out of range, or bad month. */
1856
1857   return 0;
1858 }
1859
1860 /** Given an <b>interval</b> in seconds, try to write it to the
1861  * <b>out_len</b>-byte buffer in <b>out</b> in a human-readable form.
1862  * Return 0 on success, -1 on failure.
1863  */
1864 int
1865 format_time_interval(char *out, size_t out_len, long interval)
1866 {
1867   /* We only report seconds if there's no hours. */
1868   long sec = 0, min = 0, hour = 0, day = 0;
1869
1870   /* -LONG_MIN is LONG_MAX + 1, which causes signed overflow */
1871   if (interval < -LONG_MAX)
1872     interval = LONG_MAX;
1873   else if (interval < 0)
1874     interval = -interval;
1875
1876   if (interval >= 86400) {
1877     day = interval / 86400;
1878     interval %= 86400;
1879   }
1880   if (interval >= 3600) {
1881     hour = interval / 3600;
1882     interval %= 3600;
1883   }
1884   if (interval >= 60) {
1885     min = interval / 60;
1886     interval %= 60;
1887   }
1888   sec = interval;
1889
1890   if (day) {
1891     return tor_snprintf(out, out_len, "%ld days, %ld hours, %ld minutes",
1892                         day, hour, min);
1893   } else if (hour) {
1894     return tor_snprintf(out, out_len, "%ld hours, %ld minutes", hour, min);
1895   } else if (min) {
1896     return tor_snprintf(out, out_len, "%ld minutes, %ld seconds", min, sec);
1897   } else {
1898     return tor_snprintf(out, out_len, "%ld seconds", sec);
1899   }
1900 }
1901
1902 /* =====
1903  * Cached time
1904  * ===== */
1905
1906 #ifndef TIME_IS_FAST
1907 /** Cached estimate of the current time.  Updated around once per second;
1908  * may be a few seconds off if we are really busy.  This is a hack to avoid
1909  * calling time(NULL) (which not everybody has optimized) on critical paths.
1910  */
1911 static time_t cached_approx_time = 0;
1912
1913 /** Return a cached estimate of the current time from when
1914  * update_approx_time() was last called.  This is a hack to avoid calling
1915  * time(NULL) on critical paths: please do not even think of calling it
1916  * anywhere else. */
1917 time_t
1918 approx_time(void)
1919 {
1920   return cached_approx_time;
1921 }
1922
1923 /** Update the cached estimate of the current time.  This function SHOULD be
1924  * called once per second, and MUST be called before the first call to
1925  * get_approx_time. */
1926 void
1927 update_approx_time(time_t now)
1928 {
1929   cached_approx_time = now;
1930 }
1931 #endif
1932
1933 /* =====
1934  * Rate limiting
1935  * ===== */
1936
1937 /** If the rate-limiter <b>lim</b> is ready at <b>now</b>, return the number
1938  * of calls to rate_limit_is_ready (including this one!) since the last time
1939  * rate_limit_is_ready returned nonzero.  Otherwise return 0. */
1940 static int
1941 rate_limit_is_ready(ratelim_t *lim, time_t now)
1942 {
1943   if (lim->rate + lim->last_allowed <= now) {
1944     int res = lim->n_calls_since_last_time + 1;
1945     lim->last_allowed = now;
1946     lim->n_calls_since_last_time = 0;
1947     return res;
1948   } else {
1949     ++lim->n_calls_since_last_time;
1950     return 0;
1951   }
1952 }
1953
1954 /** If the rate-limiter <b>lim</b> is ready at <b>now</b>, return a newly
1955  * allocated string indicating how many messages were suppressed, suitable to
1956  * append to a log message.  Otherwise return NULL. */
1957 char *
1958 rate_limit_log(ratelim_t *lim, time_t now)
1959 {
1960   int n;
1961   if ((n = rate_limit_is_ready(lim, now))) {
1962     if (n == 1) {
1963       return tor_strdup("");
1964     } else {
1965       char *cp=NULL;
1966       tor_asprintf(&cp,
1967                    " [%d similar message(s) suppressed in last %d seconds]",
1968                    n-1, lim->rate);
1969       return cp;
1970     }
1971   } else {
1972     return NULL;
1973   }
1974 }
1975
1976 /* =====
1977  * File helpers
1978  * ===== */
1979
1980 /** Write <b>count</b> bytes from <b>buf</b> to <b>fd</b>.  <b>isSocket</b>
1981  * must be 1 if fd was returned by socket() or accept(), and 0 if fd
1982  * was returned by open().  Return the number of bytes written, or -1
1983  * on error.  Only use if fd is a blocking fd.  */
1984 ssize_t
1985 write_all(tor_socket_t fd, const char *buf, size_t count, int isSocket)
1986 {
1987   size_t written = 0;
1988   ssize_t result;
1989   tor_assert(count < SSIZE_MAX);
1990
1991   while (written != count) {
1992     if (isSocket)
1993       result = tor_socket_send(fd, buf+written, count-written, 0);
1994     else
1995       result = write((int)fd, buf+written, count-written);
1996     if (result<0)
1997       return -1;
1998     written += result;
1999   }
2000   return (ssize_t)count;
2001 }
2002
2003 /** Read from <b>fd</b> to <b>buf</b>, until we get <b>count</b> bytes
2004  * or reach the end of the file. <b>isSocket</b> must be 1 if fd
2005  * was returned by socket() or accept(), and 0 if fd was returned by
2006  * open().  Return the number of bytes read, or -1 on error. Only use
2007  * if fd is a blocking fd. */
2008 ssize_t
2009 read_all(tor_socket_t fd, char *buf, size_t count, int isSocket)
2010 {
2011   size_t numread = 0;
2012   ssize_t result;
2013
2014   if (count > SIZE_T_CEILING || count > SSIZE_MAX)
2015     return -1;
2016
2017   while (numread != count) {
2018     if (isSocket)
2019       result = tor_socket_recv(fd, buf+numread, count-numread, 0);
2020     else
2021       result = read((int)fd, buf+numread, count-numread);
2022     if (result<0)
2023       return -1;
2024     else if (result == 0)
2025       break;
2026     numread += result;
2027   }
2028   return (ssize_t)numread;
2029 }
2030
2031 /*
2032  *    Filesystem operations.
2033  */
2034
2035 /** Clean up <b>name</b> so that we can use it in a call to "stat".  On Unix,
2036  * we do nothing.  On Windows, we remove a trailing slash, unless the path is
2037  * the root of a disk. */
2038 static void
2039 clean_name_for_stat(char *name)
2040 {
2041 #ifdef _WIN32
2042   size_t len = strlen(name);
2043   if (!len)
2044     return;
2045   if (name[len-1]=='\\' || name[len-1]=='/') {
2046     if (len == 1 || (len==3 && name[1]==':'))
2047       return;
2048     name[len-1]='\0';
2049   }
2050 #else
2051   (void)name;
2052 #endif
2053 }
2054
2055 /** Return:
2056  * FN_ERROR if filename can't be read, is NULL, or is zero-length,
2057  * FN_NOENT if it doesn't exist,
2058  * FN_FILE if it is a non-empty regular file, or a FIFO on unix-like systems,
2059  * FN_EMPTY for zero-byte regular files,
2060  * FN_DIR if it's a directory, and
2061  * FN_ERROR for any other file type.
2062  * On FN_ERROR and FN_NOENT, sets errno.  (errno is not set when FN_ERROR
2063  * is returned due to an unhandled file type.) */
2064 file_status_t
2065 file_status(const char *fname)
2066 {
2067   struct stat st;
2068   char *f;
2069   int r;
2070   if (!fname || strlen(fname) == 0) {
2071     return FN_ERROR;
2072   }
2073   f = tor_strdup(fname);
2074   clean_name_for_stat(f);
2075   log_debug(LD_FS, "stat()ing %s", f);
2076   r = stat(sandbox_intern_string(f), &st);
2077   tor_free(f);
2078   if (r) {
2079     if (errno == ENOENT) {
2080       return FN_NOENT;
2081     }
2082     return FN_ERROR;
2083   }
2084   if (st.st_mode & S_IFDIR) {
2085     return FN_DIR;
2086   } else if (st.st_mode & S_IFREG) {
2087     if (st.st_size > 0) {
2088       return FN_FILE;
2089     } else if (st.st_size == 0) {
2090       return FN_EMPTY;
2091     } else {
2092       return FN_ERROR;
2093     }
2094 #ifndef _WIN32
2095   } else if (st.st_mode & S_IFIFO) {
2096     return FN_FILE;
2097 #endif
2098   } else {
2099     return FN_ERROR;
2100   }
2101 }
2102
2103 /** Check whether <b>dirname</b> exists and is private.  If yes return 0.  If
2104  * it does not exist, and <b>check</b>&CPD_CREATE is set, try to create it
2105  * and return 0 on success. If it does not exist, and
2106  * <b>check</b>&CPD_CHECK, and we think we can create it, return 0.  Else
2107  * return -1.  If CPD_GROUP_OK is set, then it's okay if the directory
2108  * is group-readable, but in all cases we create the directory mode 0700.
2109  * If CPD_GROUP_READ is set, existing directory behaves as CPD_GROUP_OK and
2110  * if the directory is created it will use mode 0750 with group read
2111  * permission. Group read privileges also assume execute permission
2112  * as norm for directories. If CPD_CHECK_MODE_ONLY is set, then we don't
2113  * alter the directory permissions if they are too permissive:
2114  * we just return -1.
2115  * When effective_user is not NULL, check permissions against the given user
2116  * and its primary group.
2117  */
2118 int
2119 check_private_dir(const char *dirname, cpd_check_t check,
2120                   const char *effective_user)
2121 {
2122   int r;
2123   struct stat st;
2124   char *f;
2125 #ifndef _WIN32
2126   unsigned unwanted_bits = 0;
2127   const struct passwd *pw = NULL;
2128   uid_t running_uid;
2129   gid_t running_gid;
2130 #else
2131   (void)effective_user;
2132 #endif
2133
2134   tor_assert(dirname);
2135   f = tor_strdup(dirname);
2136   clean_name_for_stat(f);
2137   log_debug(LD_FS, "stat()ing %s", f);
2138   r = stat(sandbox_intern_string(f), &st);
2139   tor_free(f);
2140   if (r) {
2141     if (errno != ENOENT) {
2142       log_warn(LD_FS, "Directory %s cannot be read: %s", dirname,
2143                strerror(errno));
2144       return -1;
2145     }
2146     if (check & CPD_CREATE) {
2147       log_info(LD_GENERAL, "Creating directory %s", dirname);
2148 #if defined (_WIN32)
2149       r = mkdir(dirname);
2150 #else
2151       if (check & CPD_GROUP_READ) {
2152         r = mkdir(dirname, 0750);
2153       } else {
2154         r = mkdir(dirname, 0700);
2155       }
2156 #endif
2157       if (r) {
2158         log_warn(LD_FS, "Error creating directory %s: %s", dirname,
2159             strerror(errno));
2160         return -1;
2161       }
2162     } else if (!(check & CPD_CHECK)) {
2163       log_warn(LD_FS, "Directory %s does not exist.", dirname);
2164       return -1;
2165     }
2166     /* XXXX In the case where check==CPD_CHECK, we should look at the
2167      * parent directory a little harder. */
2168     return 0;
2169   }
2170   if (!(st.st_mode & S_IFDIR)) {
2171     log_warn(LD_FS, "%s is not a directory", dirname);
2172     return -1;
2173   }
2174 #ifndef _WIN32
2175   if (effective_user) {
2176     /* Look up the user and group information.
2177      * If we have a problem, bail out. */
2178     pw = tor_getpwnam(effective_user);
2179     if (pw == NULL) {
2180       log_warn(LD_CONFIG, "Error setting configured user: %s not found",
2181                effective_user);
2182       return -1;
2183     }
2184     running_uid = pw->pw_uid;
2185     running_gid = pw->pw_gid;
2186   } else {
2187     running_uid = getuid();
2188     running_gid = getgid();
2189   }
2190
2191   if (st.st_uid != running_uid) {
2192     const struct passwd *pw = NULL;
2193     char *process_ownername = NULL;
2194
2195     pw = tor_getpwuid(running_uid);
2196     process_ownername = pw ? tor_strdup(pw->pw_name) : tor_strdup("<unknown>");
2197
2198     pw = tor_getpwuid(st.st_uid);
2199
2200     log_warn(LD_FS, "%s is not owned by this user (%s, %d) but by "
2201         "%s (%d). Perhaps you are running Tor as the wrong user?",
2202                          dirname, process_ownername, (int)running_uid,
2203                          pw ? pw->pw_name : "<unknown>", (int)st.st_uid);
2204
2205     tor_free(process_ownername);
2206     return -1;
2207   }
2208   if ( (check & (CPD_GROUP_OK|CPD_GROUP_READ))
2209        && (st.st_gid != running_gid) ) {
2210     struct group *gr;
2211     char *process_groupname = NULL;
2212     gr = getgrgid(running_gid);
2213     process_groupname = gr ? tor_strdup(gr->gr_name) : tor_strdup("<unknown>");
2214     gr = getgrgid(st.st_gid);
2215
2216     log_warn(LD_FS, "%s is not owned by this group (%s, %d) but by group "
2217              "%s (%d).  Are you running Tor as the wrong user?",
2218              dirname, process_groupname, (int)running_gid,
2219              gr ?  gr->gr_name : "<unknown>", (int)st.st_gid);
2220
2221     tor_free(process_groupname);
2222     return -1;
2223   }
2224   if (check & (CPD_GROUP_OK|CPD_GROUP_READ)) {
2225     unwanted_bits = 0027;
2226   } else {
2227     unwanted_bits = 0077;
2228   }
2229   if ((st.st_mode & unwanted_bits) != 0) {
2230     unsigned new_mode;
2231     if (check & CPD_CHECK_MODE_ONLY) {
2232       log_warn(LD_FS, "Permissions on directory %s are too permissive.",
2233                dirname);
2234       return -1;
2235     }
2236     log_warn(LD_FS, "Fixing permissions on directory %s", dirname);
2237     new_mode = st.st_mode;
2238     new_mode |= 0700; /* Owner should have rwx */
2239     if (check & CPD_GROUP_READ) {
2240       new_mode |= 0050; /* Group should have rx */
2241     }
2242     new_mode &= ~unwanted_bits; /* Clear the bits that we didn't want set...*/
2243     if (chmod(dirname, new_mode)) {
2244       log_warn(LD_FS, "Could not chmod directory %s: %s", dirname,
2245                strerror(errno));
2246       return -1;
2247     } else {
2248       return 0;
2249     }
2250   }
2251 #endif
2252   return 0;
2253 }
2254
2255 /** Create a file named <b>fname</b> with the contents <b>str</b>.  Overwrite
2256  * the previous <b>fname</b> if possible.  Return 0 on success, -1 on failure.
2257  *
2258  * This function replaces the old file atomically, if possible.  This
2259  * function, and all other functions in util.c that create files, create them
2260  * with mode 0600.
2261  */
2262 int
2263 write_str_to_file(const char *fname, const char *str, int bin)
2264 {
2265 #ifdef _WIN32
2266   if (!bin && strchr(str, '\r')) {
2267     log_warn(LD_BUG,
2268              "We're writing a text string that already contains a CR to %s",
2269              escaped(fname));
2270   }
2271 #endif
2272   return write_bytes_to_file(fname, str, strlen(str), bin);
2273 }
2274
2275 /** Represents a file that we're writing to, with support for atomic commit:
2276  * we can write into a temporary file, and either remove the file on
2277  * failure, or replace the original file on success. */
2278 struct open_file_t {
2279   char *tempname; /**< Name of the temporary file. */
2280   char *filename; /**< Name of the original file. */
2281   unsigned rename_on_close:1; /**< Are we using the temporary file or not? */
2282   unsigned binary:1; /**< Did we open in binary mode? */
2283   int fd; /**< fd for the open file. */
2284   FILE *stdio_file; /**< stdio wrapper for <b>fd</b>. */
2285 };
2286
2287 /** Try to start writing to the file in <b>fname</b>, passing the flags
2288  * <b>open_flags</b> to the open() syscall, creating the file (if needed) with
2289  * access value <b>mode</b>.  If the O_APPEND flag is set, we append to the
2290  * original file.  Otherwise, we open a new temporary file in the same
2291  * directory, and either replace the original or remove the temporary file
2292  * when we're done.
2293  *
2294  * Return the fd for the newly opened file, and store working data in
2295  * *<b>data_out</b>.  The caller should not close the fd manually:
2296  * instead, call finish_writing_to_file() or abort_writing_to_file().
2297  * Returns -1 on failure.
2298  *
2299  * NOTE: When not appending, the flags O_CREAT and O_TRUNC are treated
2300  * as true and the flag O_EXCL is treated as false.
2301  *
2302  * NOTE: Ordinarily, O_APPEND means "seek to the end of the file before each
2303  * write()".  We don't do that.
2304  */
2305 int
2306 start_writing_to_file(const char *fname, int open_flags, int mode,
2307                       open_file_t **data_out)
2308 {
2309   open_file_t *new_file = tor_malloc_zero(sizeof(open_file_t));
2310   const char *open_name;
2311   int append = 0;
2312
2313   tor_assert(fname);
2314   tor_assert(data_out);
2315 #if (O_BINARY != 0 && O_TEXT != 0)
2316   tor_assert((open_flags & (O_BINARY|O_TEXT)) != 0);
2317 #endif
2318   new_file->fd = -1;
2319   new_file->filename = tor_strdup(fname);
2320   if (open_flags & O_APPEND) {
2321     open_name = fname;
2322     new_file->rename_on_close = 0;
2323     append = 1;
2324     open_flags &= ~O_APPEND;
2325   } else {
2326     tor_asprintf(&new_file->tempname, "%s.tmp", fname);
2327     open_name = new_file->tempname;
2328     /* We always replace an existing temporary file if there is one. */
2329     open_flags |= O_CREAT|O_TRUNC;
2330     open_flags &= ~O_EXCL;
2331     new_file->rename_on_close = 1;
2332   }
2333 #if O_BINARY != 0
2334   if (open_flags & O_BINARY)
2335     new_file->binary = 1;
2336 #endif
2337
2338   new_file->fd = tor_open_cloexec(open_name, open_flags, mode);
2339   if (new_file->fd < 0) {
2340     log_warn(LD_FS, "Couldn't open \"%s\" (%s) for writing: %s",
2341         open_name, fname, strerror(errno));
2342     goto err;
2343   }
2344   if (append) {
2345     if (tor_fd_seekend(new_file->fd) < 0) {
2346       log_warn(LD_FS, "Couldn't seek to end of file \"%s\": %s", open_name,
2347                strerror(errno));
2348       goto err;
2349     }
2350   }
2351
2352   *data_out = new_file;
2353
2354   return new_file->fd;
2355
2356  err:
2357   if (new_file->fd >= 0)
2358     close(new_file->fd);
2359   *data_out = NULL;
2360   tor_free(new_file->filename);
2361   tor_free(new_file->tempname);
2362   tor_free(new_file);
2363   return -1;
2364 }
2365
2366 /** Given <b>file_data</b> from start_writing_to_file(), return a stdio FILE*
2367  * that can be used to write to the same file.  The caller should not mix
2368  * stdio calls with non-stdio calls. */
2369 FILE *
2370 fdopen_file(open_file_t *file_data)
2371 {
2372   tor_assert(file_data);
2373   if (file_data->stdio_file)
2374     return file_data->stdio_file;
2375   tor_assert(file_data->fd >= 0);
2376   if (!(file_data->stdio_file = fdopen(file_data->fd,
2377                                        file_data->binary?"ab":"a"))) {
2378     log_warn(LD_FS, "Couldn't fdopen \"%s\" [%d]: %s", file_data->filename,
2379              file_data->fd, strerror(errno));
2380   }
2381   return file_data->stdio_file;
2382 }
2383
2384 /** Combines start_writing_to_file with fdopen_file(): arguments are as
2385  * for start_writing_to_file, but  */
2386 FILE *
2387 start_writing_to_stdio_file(const char *fname, int open_flags, int mode,
2388                             open_file_t **data_out)
2389 {
2390   FILE *res;
2391   if (start_writing_to_file(fname, open_flags, mode, data_out)<0)
2392     return NULL;
2393   if (!(res = fdopen_file(*data_out))) {
2394     abort_writing_to_file(*data_out);
2395     *data_out = NULL;
2396   }
2397   return res;
2398 }
2399
2400 /** Helper function: close and free the underlying file and memory in
2401  * <b>file_data</b>.  If we were writing into a temporary file, then delete
2402  * that file (if abort_write is true) or replaces the target file with
2403  * the temporary file (if abort_write is false). */
2404 static int
2405 finish_writing_to_file_impl(open_file_t *file_data, int abort_write)
2406 {
2407   int r = 0;
2408
2409   tor_assert(file_data && file_data->filename);
2410   if (file_data->stdio_file) {
2411     if (fclose(file_data->stdio_file)) {
2412       log_warn(LD_FS, "Error closing \"%s\": %s", file_data->filename,
2413                strerror(errno));
2414       abort_write = r = -1;
2415     }
2416   } else if (file_data->fd >= 0 && close(file_data->fd) < 0) {
2417     log_warn(LD_FS, "Error flushing \"%s\": %s", file_data->filename,
2418              strerror(errno));
2419     abort_write = r = -1;
2420   }
2421
2422   if (file_data->rename_on_close) {
2423     tor_assert(file_data->tempname && file_data->filename);
2424     if (abort_write) {
2425       int res = unlink(file_data->tempname);
2426       if (res != 0) {
2427         /* We couldn't unlink and we'll leave a mess behind */
2428         log_warn(LD_FS, "Failed to unlink %s: %s",
2429                  file_data->tempname, strerror(errno));
2430         r = -1;
2431       }
2432     } else {
2433       tor_assert(strcmp(file_data->filename, file_data->tempname));
2434       if (replace_file(file_data->tempname, file_data->filename)) {
2435         log_warn(LD_FS, "Error replacing \"%s\": %s", file_data->filename,
2436                  strerror(errno));
2437         r = -1;
2438       }
2439     }
2440   }
2441
2442   tor_free(file_data->filename);
2443   tor_free(file_data->tempname);
2444   tor_free(file_data);
2445
2446   return r;
2447 }
2448
2449 /** Finish writing to <b>file_data</b>: close the file handle, free memory as
2450  * needed, and if using a temporary file, replace the original file with
2451  * the temporary file. */
2452 int
2453 finish_writing_to_file(open_file_t *file_data)
2454 {
2455   return finish_writing_to_file_impl(file_data, 0);
2456 }
2457
2458 /** Finish writing to <b>file_data</b>: close the file handle, free memory as
2459  * needed, and if using a temporary file, delete it. */
2460 int
2461 abort_writing_to_file(open_file_t *file_data)
2462 {
2463   return finish_writing_to_file_impl(file_data, 1);
2464 }
2465
2466 /** Helper: given a set of flags as passed to open(2), open the file
2467  * <b>fname</b> and write all the sized_chunk_t structs in <b>chunks</b> to
2468  * the file.  Do so as atomically as possible e.g. by opening temp files and
2469  * renaming. */
2470 static int
2471 write_chunks_to_file_impl(const char *fname, const smartlist_t *chunks,
2472                           int open_flags)
2473 {
2474   open_file_t *file = NULL;
2475   int fd;
2476   ssize_t result;
2477   fd = start_writing_to_file(fname, open_flags, 0600, &file);
2478   if (fd<0)
2479     return -1;
2480   SMARTLIST_FOREACH(chunks, sized_chunk_t *, chunk,
2481   {
2482     result = write_all(fd, chunk->bytes, chunk->len, 0);
2483     if (result < 0) {
2484       log_warn(LD_FS, "Error writing to \"%s\": %s", fname,
2485           strerror(errno));
2486       goto err;
2487     }
2488     tor_assert((size_t)result == chunk->len);
2489   });
2490
2491   return finish_writing_to_file(file);
2492  err:
2493   abort_writing_to_file(file);
2494   return -1;
2495 }
2496
2497 /** Given a smartlist of sized_chunk_t, write them to a file
2498  * <b>fname</b>, overwriting or creating the file as necessary.
2499  * If <b>no_tempfile</b> is 0 then the file will be written
2500  * atomically. */
2501 int
2502 write_chunks_to_file(const char *fname, const smartlist_t *chunks, int bin,
2503                      int no_tempfile)
2504 {
2505   int flags = OPEN_FLAGS_REPLACE|(bin?O_BINARY:O_TEXT);
2506
2507   if (no_tempfile) {
2508     /* O_APPEND stops write_chunks_to_file from using tempfiles */
2509     flags |= O_APPEND;
2510   }
2511   return write_chunks_to_file_impl(fname, chunks, flags);
2512 }
2513
2514 /** Write <b>len</b> bytes, starting at <b>str</b>, to <b>fname</b>
2515     using the open() flags passed in <b>flags</b>. */
2516 static int
2517 write_bytes_to_file_impl(const char *fname, const char *str, size_t len,
2518                          int flags)
2519 {
2520   int r;
2521   sized_chunk_t c = { str, len };
2522   smartlist_t *chunks = smartlist_new();
2523   smartlist_add(chunks, &c);
2524   r = write_chunks_to_file_impl(fname, chunks, flags);
2525   smartlist_free(chunks);
2526   return r;
2527 }
2528
2529 /** As write_str_to_file, but does not assume a NUL-terminated
2530  * string. Instead, we write <b>len</b> bytes, starting at <b>str</b>. */
2531 MOCK_IMPL(int,
2532 write_bytes_to_file,(const char *fname, const char *str, size_t len,
2533                      int bin))
2534 {
2535   return write_bytes_to_file_impl(fname, str, len,
2536                                   OPEN_FLAGS_REPLACE|(bin?O_BINARY:O_TEXT));
2537 }
2538
2539 /** As write_bytes_to_file, but if the file already exists, append the bytes
2540  * to the end of the file instead of overwriting it. */
2541 int
2542 append_bytes_to_file(const char *fname, const char *str, size_t len,
2543                      int bin)
2544 {
2545   return write_bytes_to_file_impl(fname, str, len,
2546                                   OPEN_FLAGS_APPEND|(bin?O_BINARY:O_TEXT));
2547 }
2548
2549 /** Like write_str_to_file(), but also return -1 if there was a file
2550     already residing in <b>fname</b>. */
2551 int
2552 write_bytes_to_new_file(const char *fname, const char *str, size_t len,
2553                         int bin)
2554 {
2555   return write_bytes_to_file_impl(fname, str, len,
2556                                   OPEN_FLAGS_DONT_REPLACE|
2557                                   (bin?O_BINARY:O_TEXT));
2558 }
2559
2560 /**
2561  * Read the contents of the open file <b>fd</b> presuming it is a FIFO
2562  * (or similar) file descriptor for which the size of the file isn't
2563  * known ahead of time. Return NULL on failure, and a NUL-terminated
2564  * string on success.  On success, set <b>sz_out</b> to the number of
2565  * bytes read.
2566  */
2567 char *
2568 read_file_to_str_until_eof(int fd, size_t max_bytes_to_read, size_t *sz_out)
2569 {
2570   ssize_t r;
2571   size_t pos = 0;
2572   char *string = NULL;
2573   size_t string_max = 0;
2574
2575   if (max_bytes_to_read+1 >= SIZE_T_CEILING)
2576     return NULL;
2577
2578   do {
2579     /* XXXX This "add 1K" approach is a little goofy; if we care about
2580      * performance here, we should be doubling.  But in practice we shouldn't
2581      * be using this function on big files anyway. */
2582     string_max = pos + 1024;
2583     if (string_max > max_bytes_to_read)
2584       string_max = max_bytes_to_read + 1;
2585     string = tor_realloc(string, string_max);
2586     r = read(fd, string + pos, string_max - pos - 1);
2587     if (r < 0) {
2588       tor_free(string);
2589       return NULL;
2590     }
2591
2592     pos += r;
2593   } while (r > 0 && pos < max_bytes_to_read);
2594
2595   tor_assert(pos < string_max);
2596   *sz_out = pos;
2597   string[pos] = '\0';
2598   return string;
2599 }
2600
2601 /** Read the contents of <b>filename</b> into a newly allocated
2602  * string; return the string on success or NULL on failure.
2603  *
2604  * If <b>stat_out</b> is provided, store the result of stat()ing the
2605  * file into <b>stat_out</b>.
2606  *
2607  * If <b>flags</b> &amp; RFTS_BIN, open the file in binary mode.
2608  * If <b>flags</b> &amp; RFTS_IGNORE_MISSING, don't warn if the file
2609  * doesn't exist.
2610  */
2611 /*
2612  * This function <em>may</em> return an erroneous result if the file
2613  * is modified while it is running, but must not crash or overflow.
2614  * Right now, the error case occurs when the file length grows between
2615  * the call to stat and the call to read_all: the resulting string will
2616  * be truncated.
2617  */
2618 char *
2619 read_file_to_str(const char *filename, int flags, struct stat *stat_out)
2620 {
2621   int fd; /* router file */
2622   struct stat statbuf;
2623   char *string;
2624   ssize_t r;
2625   int bin = flags & RFTS_BIN;
2626
2627   tor_assert(filename);
2628
2629   fd = tor_open_cloexec(filename,O_RDONLY|(bin?O_BINARY:O_TEXT),0);
2630   if (fd<0) {
2631     int severity = LOG_WARN;
2632     int save_errno = errno;
2633     if (errno == ENOENT && (flags & RFTS_IGNORE_MISSING))
2634       severity = LOG_INFO;
2635     log_fn(severity, LD_FS,"Could not open \"%s\": %s",filename,
2636            strerror(errno));
2637     errno = save_errno;
2638     return NULL;
2639   }
2640
2641   if (fstat(fd, &statbuf)<0) {
2642     int save_errno = errno;
2643     close(fd);
2644     log_warn(LD_FS,"Could not fstat \"%s\".",filename);
2645     errno = save_errno;
2646     return NULL;
2647   }
2648
2649 #ifndef _WIN32
2650 /** When we detect that we're reading from a FIFO, don't read more than
2651  * this many bytes.  It's insane overkill for most uses. */
2652 #define FIFO_READ_MAX (1024*1024)
2653   if (S_ISFIFO(statbuf.st_mode)) {
2654     size_t sz = 0;
2655     string = read_file_to_str_until_eof(fd, FIFO_READ_MAX, &sz);
2656     if (string && stat_out) {
2657       statbuf.st_size = sz;
2658       memcpy(stat_out, &statbuf, sizeof(struct stat));
2659     }
2660     close(fd);
2661     return string;
2662   }
2663 #endif
2664
2665   if ((uint64_t)(statbuf.st_size)+1 >= SIZE_T_CEILING) {
2666     close(fd);
2667     return NULL;
2668   }
2669
2670   string = tor_malloc((size_t)(statbuf.st_size+1));
2671
2672   r = read_all(fd,string,(size_t)statbuf.st_size,0);
2673   if (r<0) {
2674     int save_errno = errno;
2675     log_warn(LD_FS,"Error reading from file \"%s\": %s", filename,
2676              strerror(errno));
2677     tor_free(string);
2678     close(fd);
2679     errno = save_errno;
2680     return NULL;
2681   }
2682   string[r] = '\0'; /* NUL-terminate the result. */
2683
2684 #if defined(_WIN32) || defined(__CYGWIN__)
2685   if (!bin && strchr(string, '\r')) {
2686     log_debug(LD_FS, "We didn't convert CRLF to LF as well as we hoped "
2687               "when reading %s. Coping.",
2688               filename);
2689     tor_strstrip(string, "\r");
2690     r = strlen(string);
2691   }
2692   if (!bin) {
2693     statbuf.st_size = (size_t) r;
2694   } else
2695 #endif
2696     if (r != statbuf.st_size) {
2697       /* Unless we're using text mode on win32, we'd better have an exact
2698        * match for size. */
2699       int save_errno = errno;
2700       log_warn(LD_FS,"Could read only %d of %ld bytes of file \"%s\".",
2701                (int)r, (long)statbuf.st_size,filename);
2702       tor_free(string);
2703       close(fd);
2704       errno = save_errno;
2705       return NULL;
2706     }
2707   close(fd);
2708   if (stat_out) {
2709     memcpy(stat_out, &statbuf, sizeof(struct stat));
2710   }
2711
2712   return string;
2713 }
2714
2715 #define TOR_ISODIGIT(c) ('0' <= (c) && (c) <= '7')
2716
2717 /** Given a c-style double-quoted escaped string in <b>s</b>, extract and
2718  * decode its contents into a newly allocated string.  On success, assign this
2719  * string to *<b>result</b>, assign its length to <b>size_out</b> (if
2720  * provided), and return a pointer to the position in <b>s</b> immediately
2721  * after the string.  On failure, return NULL.
2722  */
2723 static const char *
2724 unescape_string(const char *s, char **result, size_t *size_out)
2725 {
2726   const char *cp;
2727   char *out;
2728   if (s[0] != '\"')
2729     return NULL;
2730   cp = s+1;
2731   while (1) {
2732     switch (*cp) {
2733       case '\0':
2734       case '\n':
2735         return NULL;
2736       case '\"':
2737         goto end_of_loop;
2738       case '\\':
2739         if (cp[1] == 'x' || cp[1] == 'X') {
2740           if (!(TOR_ISXDIGIT(cp[2]) && TOR_ISXDIGIT(cp[3])))
2741             return NULL;
2742           cp += 4;
2743         } else if (TOR_ISODIGIT(cp[1])) {
2744           cp += 2;
2745           if (TOR_ISODIGIT(*cp)) ++cp;
2746           if (TOR_ISODIGIT(*cp)) ++cp;
2747         } else if (cp[1] == 'n' || cp[1] == 'r' || cp[1] == 't' || cp[1] == '"'
2748                    || cp[1] == '\\' || cp[1] == '\'') {
2749           cp += 2;
2750         } else {
2751           return NULL;
2752         }
2753         break;
2754       default:
2755         ++cp;
2756         break;
2757     }
2758   }
2759  end_of_loop:
2760   out = *result = tor_malloc(cp-s + 1);
2761   cp = s+1;
2762   while (1) {
2763     switch (*cp)
2764       {
2765       case '\"':
2766         *out = '\0';
2767         if (size_out) *size_out = out - *result;
2768         return cp+1;
2769       case '\0':
2770         tor_fragile_assert();
2771         tor_free(*result);
2772         return NULL;
2773       case '\\':
2774         switch (cp[1])
2775           {
2776           case 'n': *out++ = '\n'; cp += 2; break;
2777           case 'r': *out++ = '\r'; cp += 2; break;
2778           case 't': *out++ = '\t'; cp += 2; break;
2779           case 'x': case 'X':
2780             {
2781               int x1, x2;
2782
2783               x1 = hex_decode_digit(cp[2]);
2784               x2 = hex_decode_digit(cp[3]);
2785               if (x1 == -1 || x2 == -1) {
2786                   tor_free(*result);
2787                   return NULL;
2788               }
2789
2790               *out++ = ((x1<<4) + x2);
2791               cp += 4;
2792             }
2793             break;
2794           case '0': case '1': case '2': case '3': case '4': case '5':
2795           case '6': case '7':
2796             {
2797               int n = cp[1]-'0';
2798               cp += 2;
2799               if (TOR_ISODIGIT(*cp)) { n = n*8 + *cp-'0'; cp++; }
2800               if (TOR_ISODIGIT(*cp)) { n = n*8 + *cp-'0'; cp++; }
2801               if (n > 255) { tor_free(*result); return NULL; }
2802               *out++ = (char)n;
2803             }
2804             break;
2805           case '\'':
2806           case '\"':
2807           case '\\':
2808           case '\?':
2809             *out++ = cp[1];
2810             cp += 2;
2811             break;
2812           default:
2813             tor_free(*result); return NULL;
2814           }
2815         break;
2816       default:
2817         *out++ = *cp++;
2818       }
2819   }
2820 }
2821
2822 /** Given a string containing part of a configuration file or similar format,
2823  * advance past comments and whitespace and try to parse a single line.  If we
2824  * parse a line successfully, set *<b>key_out</b> to a new string holding the
2825  * key portion and *<b>value_out</b> to a new string holding the value portion
2826  * of the line, and return a pointer to the start of the next line.  If we run
2827  * out of data, return a pointer to the end of the string.  If we encounter an
2828  * error, return NULL and set *<b>err_out</b> (if provided) to an error
2829  * message.
2830  */
2831 const char *
2832 parse_config_line_from_str_verbose(const char *line, char **key_out,
2833                                    char **value_out,
2834                                    const char **err_out)
2835 {
2836   /* I believe the file format here is supposed to be:
2837      FILE = (EMPTYLINE | LINE)* (EMPTYLASTLINE | LASTLINE)?
2838
2839      EMPTYLASTLINE = SPACE* | COMMENT
2840      EMPTYLINE = EMPTYLASTLINE NL
2841      SPACE = ' ' | '\r' | '\t'
2842      COMMENT = '#' NOT-NL*
2843      NOT-NL = Any character except '\n'
2844      NL = '\n'
2845
2846      LASTLINE = SPACE* KEY SPACE* VALUES
2847      LINE = LASTLINE NL
2848      KEY = KEYCHAR+
2849      KEYCHAR = Any character except ' ', '\r', '\n', '\t', '#', "\"
2850
2851      VALUES = QUOTEDVALUE | NORMALVALUE
2852      QUOTEDVALUE = QUOTE QVCHAR* QUOTE EOLSPACE?
2853      QUOTE = '"'
2854      QVCHAR = KEYCHAR | ESC ('n' | 't' | 'r' | '"' | ESC |'\'' | OCTAL | HEX)
2855      ESC = "\\"
2856      OCTAL = ODIGIT (ODIGIT ODIGIT?)?
2857      HEX = ('x' | 'X') HEXDIGIT HEXDIGIT
2858      ODIGIT = '0' .. '7'
2859      HEXDIGIT = '0'..'9' | 'a' .. 'f' | 'A' .. 'F'
2860      EOLSPACE = SPACE* COMMENT?
2861
2862      NORMALVALUE = (VALCHAR | ESC ESC_IGNORE | CONTINUATION)* EOLSPACE?
2863      VALCHAR = Any character except ESC, '#', and '\n'
2864      ESC_IGNORE = Any character except '#' or '\n'
2865      CONTINUATION = ESC NL ( COMMENT NL )*
2866    */
2867
2868   const char *key, *val, *cp;
2869   int continuation = 0;
2870
2871   tor_assert(key_out);
2872   tor_assert(value_out);
2873
2874   *key_out = *value_out = NULL;
2875   key = val = NULL;
2876   /* Skip until the first keyword. */
2877   while (1) {
2878     while (TOR_ISSPACE(*line))
2879       ++line;
2880     if (*line == '#') {
2881       while (*line && *line != '\n')
2882         ++line;
2883     } else {
2884       break;
2885     }
2886   }
2887
2888   if (!*line) { /* End of string? */
2889     *key_out = *value_out = NULL;
2890     return line;
2891   }
2892
2893   /* Skip until the next space or \ followed by newline. */
2894   key = line;
2895   while (*line && !TOR_ISSPACE(*line) && *line != '#' &&
2896          ! (line[0] == '\\' && line[1] == '\n'))
2897     ++line;
2898   *key_out = tor_strndup(key, line-key);
2899
2900   /* Skip until the value. */
2901   while (*line == ' ' || *line == '\t')
2902     ++line;
2903
2904   val = line;
2905
2906   /* Find the end of the line. */
2907   if (*line == '\"') { // XXX No continuation handling is done here
2908     if (!(line = unescape_string(line, value_out, NULL))) {
2909       if (err_out)
2910         *err_out = "Invalid escape sequence in quoted string";
2911       return NULL;
2912     }
2913     while (*line == ' ' || *line == '\t')
2914       ++line;
2915     if (*line && *line != '#' && *line != '\n') {
2916       if (err_out)
2917         *err_out = "Excess data after quoted string";
2918       return NULL;
2919     }
2920   } else {
2921     /* Look for the end of the line. */
2922     while (*line && *line != '\n' && (*line != '#' || continuation)) {
2923       if (*line == '\\' && line[1] == '\n') {
2924         continuation = 1;
2925         line += 2;
2926       } else if (*line == '#') {
2927         do {
2928           ++line;
2929         } while (*line && *line != '\n');
2930         if (*line == '\n')
2931           ++line;
2932       } else {
2933         ++line;
2934       }
2935     }
2936
2937     if (*line == '\n') {
2938       cp = line++;
2939     } else {
2940       cp = line;
2941     }
2942     /* Now back cp up to be the last nonspace character */
2943     while (cp>val && TOR_ISSPACE(*(cp-1)))
2944       --cp;
2945
2946     tor_assert(cp >= val);
2947
2948     /* Now copy out and decode the value. */
2949     *value_out = tor_strndup(val, cp-val);
2950     if (continuation) {
2951       char *v_out, *v_in;
2952       v_out = v_in = *value_out;
2953       while (*v_in) {
2954         if (*v_in == '#') {
2955           do {
2956             ++v_in;
2957           } while (*v_in && *v_in != '\n');
2958           if (*v_in == '\n')
2959             ++v_in;
2960         } else if (v_in[0] == '\\' && v_in[1] == '\n') {
2961           v_in += 2;
2962         } else {
2963           *v_out++ = *v_in++;
2964         }
2965       }
2966       *v_out = '\0';
2967     }
2968   }
2969
2970   if (*line == '#') {
2971     do {
2972       ++line;
2973     } while (*line && *line != '\n');
2974   }
2975   while (TOR_ISSPACE(*line)) ++line;
2976
2977   return line;
2978 }
2979
2980 /** Expand any homedir prefix on <b>filename</b>; return a newly allocated
2981  * string. */
2982 char *
2983 expand_filename(const char *filename)
2984 {
2985   tor_assert(filename);
2986 #ifdef _WIN32
2987   return tor_strdup(filename);
2988 #else
2989   if (*filename == '~') {
2990     char *home, *result=NULL;
2991     const char *rest;
2992
2993     if (filename[1] == '/' || filename[1] == '\0') {
2994       home = getenv("HOME");
2995       if (!home) {
2996         log_warn(LD_CONFIG, "Couldn't find $HOME environment variable while "
2997                  "expanding \"%s\"; defaulting to \"\".", filename);
2998         home = tor_strdup("");
2999       } else {
3000         home = tor_strdup(home);
3001       }
3002       rest = strlen(filename)>=2?(filename+2):"";
3003     } else {
3004 #ifdef HAVE_PWD_H
3005       char *username, *slash;
3006       slash = strchr(filename, '/');
3007       if (slash)
3008         username = tor_strndup(filename+1,slash-filename-1);
3009       else
3010         username = tor_strdup(filename+1);
3011       if (!(home = get_user_homedir(username))) {
3012         log_warn(LD_CONFIG,"Couldn't get homedir for \"%s\"",username);
3013         tor_free(username);
3014         return NULL;
3015       }
3016       tor_free(username);
3017       rest = slash ? (slash+1) : "";
3018 #else
3019       log_warn(LD_CONFIG, "Couldn't expand homedir on system without pwd.h");
3020       return tor_strdup(filename);
3021 #endif
3022     }
3023     tor_assert(home);
3024     /* Remove trailing slash. */
3025     if (strlen(home)>1 && !strcmpend(home,PATH_SEPARATOR)) {
3026       home[strlen(home)-1] = '\0';
3027     }
3028     tor_asprintf(&result,"%s"PATH_SEPARATOR"%s",home,rest);
3029     tor_free(home);
3030     return result;
3031   } else {
3032     return tor_strdup(filename);
3033   }
3034 #endif
3035 }
3036
3037 #define MAX_SCANF_WIDTH 9999
3038
3039 /** Helper: given an ASCII-encoded decimal digit, return its numeric value.
3040  * NOTE: requires that its input be in-bounds. */
3041 static int
3042 digit_to_num(char d)
3043 {
3044   int num = ((int)d) - (int)'0';
3045   tor_assert(num <= 9 && num >= 0);
3046   return num;
3047 }
3048
3049 /** Helper: Read an unsigned int from *<b>bufp</b> of up to <b>width</b>
3050  * characters.  (Handle arbitrary width if <b>width</b> is less than 0.)  On
3051  * success, store the result in <b>out</b>, advance bufp to the next
3052  * character, and return 0.  On failure, return -1. */
3053 static int
3054 scan_unsigned(const char **bufp, unsigned long *out, int width, int base)
3055 {
3056   unsigned long result = 0;
3057   int scanned_so_far = 0;
3058   const int hex = base==16;
3059   tor_assert(base == 10 || base == 16);
3060   if (!bufp || !*bufp || !out)
3061     return -1;
3062   if (width<0)
3063     width=MAX_SCANF_WIDTH;
3064
3065   while (**bufp && (hex?TOR_ISXDIGIT(**bufp):TOR_ISDIGIT(**bufp))
3066          && scanned_so_far < width) {
3067     int digit = hex?hex_decode_digit(*(*bufp)++):digit_to_num(*(*bufp)++);
3068     // Check for overflow beforehand, without actually causing any overflow
3069     // This preserves functionality on compilers that don't wrap overflow
3070     // (i.e. that trap or optimise away overflow)
3071     // result * base + digit > ULONG_MAX
3072     // result * base > ULONG_MAX - digit
3073     if (result > (ULONG_MAX - digit)/base)
3074       return -1; /* Processing this digit would overflow */
3075     result = result * base + digit;
3076     ++scanned_so_far;
3077   }
3078
3079   if (!scanned_so_far) /* No actual digits scanned */
3080     return -1;
3081
3082   *out = result;
3083   return 0;
3084 }
3085
3086 /** Helper: Read an signed int from *<b>bufp</b> of up to <b>width</b>
3087  * characters.  (Handle arbitrary width if <b>width</b> is less than 0.)  On
3088  * success, store the result in <b>out</b>, advance bufp to the next
3089  * character, and return 0.  On failure, return -1. */
3090 static int
3091 scan_signed(const char **bufp, long *out, int width)
3092 {
3093   int neg = 0;
3094   unsigned long result = 0;
3095
3096   if (!bufp || !*bufp || !out)
3097     return -1;
3098   if (width<0)
3099     width=MAX_SCANF_WIDTH;
3100
3101   if (**bufp == '-') {
3102     neg = 1;
3103     ++*bufp;
3104     --width;
3105   }
3106
3107   if (scan_unsigned(bufp, &result, width, 10) < 0)
3108     return -1;
3109
3110   if (neg && result > 0) {
3111     if (result > ((unsigned long)LONG_MAX) + 1)
3112       return -1; /* Underflow */
3113     // Avoid overflow on the cast to signed long when result is LONG_MIN
3114     // by subtracting 1 from the unsigned long positive value,
3115     // then, after it has been cast to signed and negated,
3116     // subtracting the original 1 (the double-subtraction is intentional).
3117     // Otherwise, the cast to signed could cause a temporary long
3118     // to equal LONG_MAX + 1, which is undefined.
3119     // We avoid underflow on the subtraction by treating -0 as positive.
3120     *out = (-(long)(result - 1)) - 1;
3121   } else {
3122     if (result > LONG_MAX)
3123       return -1; /* Overflow */
3124     *out = (long)result;
3125   }
3126
3127   return 0;
3128 }
3129
3130 /** Helper: Read a decimal-formatted double from *<b>bufp</b> of up to
3131  * <b>width</b> characters.  (Handle arbitrary width if <b>width</b> is less
3132  * than 0.)  On success, store the result in <b>out</b>, advance bufp to the
3133  * next character, and return 0.  On failure, return -1. */
3134 static int
3135 scan_double(const char **bufp, double *out, int width)
3136 {
3137   int neg = 0;
3138   double result = 0;
3139   int scanned_so_far = 0;
3140
3141   if (!bufp || !*bufp || !out)
3142     return -1;
3143   if (width<0)
3144     width=MAX_SCANF_WIDTH;
3145
3146   if (**bufp == '-') {
3147     neg = 1;
3148     ++*bufp;
3149   }
3150
3151   while (**bufp && TOR_ISDIGIT(**bufp) && scanned_so_far < width) {
3152     const int digit = digit_to_num(*(*bufp)++);
3153     result = result * 10 + digit;
3154     ++scanned_so_far;
3155   }
3156   if (**bufp == '.') {
3157     double fracval = 0, denominator = 1;
3158     ++*bufp;
3159     ++scanned_so_far;
3160     while (**bufp && TOR_ISDIGIT(**bufp) && scanned_so_far < width) {
3161       const int digit = digit_to_num(*(*bufp)++);
3162       fracval = fracval * 10 + digit;
3163       denominator *= 10;
3164       ++scanned_so_far;
3165     }
3166     result += fracval / denominator;
3167   }
3168
3169   if (!scanned_so_far) /* No actual digits scanned */
3170     return -1;
3171
3172   *out = neg ? -result : result;
3173   return 0;
3174 }
3175
3176 /** Helper: copy up to <b>width</b> non-space characters from <b>bufp</b> to
3177  * <b>out</b>.  Make sure <b>out</b> is nul-terminated. Advance <b>bufp</b>
3178  * to the next non-space character or the EOS. */
3179 static int
3180 scan_string(const char **bufp, char *out, int width)
3181 {
3182   int scanned_so_far = 0;
3183   if (!bufp || !out || width < 0)
3184     return -1;
3185   while (**bufp && ! TOR_ISSPACE(**bufp) && scanned_so_far < width) {
3186     *out++ = *(*bufp)++;
3187     ++scanned_so_far;
3188   }
3189   *out = '\0';
3190   return 0;
3191 }
3192
3193 /** Locale-independent, minimal, no-surprises scanf variant, accepting only a
3194  * restricted pattern format.  For more info on what it supports, see
3195  * tor_sscanf() documentation.  */
3196 int
3197 tor_vsscanf(const char *buf, const char *pattern, va_list ap)
3198 {
3199   int n_matched = 0;
3200
3201   while (*pattern) {
3202     if (*pattern != '%') {
3203       if (*buf == *pattern) {
3204         ++buf;
3205         ++pattern;
3206         continue;
3207       } else {
3208         return n_matched;
3209       }
3210     } else {
3211       int width = -1;
3212       int longmod = 0;
3213       ++pattern;
3214       if (TOR_ISDIGIT(*pattern)) {
3215         width = digit_to_num(*pattern++);
3216         while (TOR_ISDIGIT(*pattern)) {
3217           width *= 10;
3218           width += digit_to_num(*pattern++);
3219           if (width > MAX_SCANF_WIDTH)
3220             return -1;
3221         }
3222         if (!width) /* No zero-width things. */
3223           return -1;
3224       }
3225       if (*pattern == 'l') {
3226         longmod = 1;
3227         ++pattern;
3228       }
3229       if (*pattern == 'u' || *pattern == 'x') {
3230         unsigned long u;
3231         const int base = (*pattern == 'u') ? 10 : 16;
3232         if (!*buf)
3233           return n_matched;
3234         if (scan_unsigned(&buf, &u, width, base)<0)
3235           return n_matched;
3236         if (longmod) {
3237           unsigned long *out = va_arg(ap, unsigned long *);
3238           *out = u;
3239         } else {
3240           unsigned *out = va_arg(ap, unsigned *);
3241           if (u > UINT_MAX)
3242             return n_matched;
3243           *out = (unsigned) u;
3244         }
3245         ++pattern;
3246         ++n_matched;
3247       } else if (*pattern == 'f') {
3248         double *d = va_arg(ap, double *);
3249         if (!longmod)
3250           return -1; /* float not supported */
3251         if (!*buf)
3252           return n_matched;
3253         if (scan_double(&buf, d, width)<0)
3254           return n_matched;
3255         ++pattern;
3256         ++n_matched;
3257       } else if (*pattern == 'd') {
3258         long lng=0;
3259         if (scan_signed(&buf, &lng, width)<0)
3260           return n_matched;
3261         if (longmod) {
3262           long *out = va_arg(ap, long *);
3263           *out = lng;
3264         } else {
3265           int *out = va_arg(ap, int *);
3266           if (lng < INT_MIN || lng > INT_MAX)
3267             return n_matched;
3268           *out = (int)lng;
3269         }
3270         ++pattern;
3271         ++n_matched;
3272       } else if (*pattern == 's') {
3273         char *s = va_arg(ap, char *);
3274         if (longmod)
3275           return -1;
3276         if (width < 0)
3277           return -1;
3278         if (scan_string(&buf, s, width)<0)
3279           return n_matched;
3280         ++pattern;
3281         ++n_matched;
3282       } else if (*pattern == 'c') {
3283         char *ch = va_arg(ap, char *);
3284         if (longmod)
3285           return -1;
3286         if (width != -1)
3287           return -1;
3288         if (!*buf)
3289           return n_matched;
3290         *ch = *buf++;
3291         ++pattern;
3292         ++n_matched;
3293       } else if (*pattern == '%') {
3294         if (*buf != '%')
3295           return n_matched;
3296         if (longmod)
3297           return -1;
3298         ++buf;
3299         ++pattern;
3300       } else {
3301         return -1; /* Unrecognized pattern component. */
3302       }
3303     }
3304   }
3305
3306   return n_matched;
3307 }
3308
3309 /** Minimal sscanf replacement: parse <b>buf</b> according to <b>pattern</b>
3310  * and store the results in the corresponding argument fields.  Differs from
3311  * sscanf in that:
3312  * <ul><li>It only handles %u, %lu, %x, %lx, %[NUM]s, %d, %ld, %lf, and %c.
3313  *     <li>It only handles decimal inputs for %lf. (12.3, not 1.23e1)
3314  *     <li>It does not handle arbitrarily long widths.
3315  *     <li>Numbers do not consume any space characters.
3316  *     <li>It is locale-independent.
3317  *     <li>%u and %x do not consume any space.
3318  *     <li>It returns -1 on malformed patterns.</ul>
3319  *
3320  * (As with other locale-independent functions, we need this to parse data that
3321  * is in ASCII without worrying that the C library's locale-handling will make
3322  * miscellaneous characters look like numbers, spaces, and so on.)
3323  */
3324 int
3325 tor_sscanf(const char *buf, const char *pattern, ...)
3326 {
3327   int r;
3328   va_list ap;
3329   va_start(ap, pattern);
3330   r = tor_vsscanf(buf, pattern, ap);
3331   va_end(ap);
3332   return r;
3333 }
3334
3335 /** Append the string produced by tor_asprintf(<b>pattern</b>, <b>...</b>)
3336  * to <b>sl</b>. */
3337 void
3338 smartlist_add_asprintf(struct smartlist_t *sl, const char *pattern, ...)
3339 {
3340   va_list ap;
3341   va_start(ap, pattern);
3342   smartlist_add_vasprintf(sl, pattern, ap);
3343   va_end(ap);
3344 }
3345
3346 /** va_list-based backend of smartlist_add_asprintf. */
3347 void
3348 smartlist_add_vasprintf(struct smartlist_t *sl, const char *pattern,
3349                         va_list args)
3350 {
3351   char *str = NULL;
3352
3353   tor_vasprintf(&str, pattern, args);
3354   tor_assert(str != NULL);
3355
3356   smartlist_add(sl, str);
3357 }
3358
3359 /** Return a new list containing the filenames in the directory <b>dirname</b>.
3360  * Return NULL on error or if <b>dirname</b> is not a directory.
3361  */
3362 smartlist_t *
3363 tor_listdir(const char *dirname)
3364 {
3365   smartlist_t *result;
3366 #ifdef _WIN32
3367   char *pattern=NULL;
3368   TCHAR tpattern[MAX_PATH] = {0};
3369   char name[MAX_PATH*2+1] = {0};
3370   HANDLE handle;
3371   WIN32_FIND_DATA findData;
3372   tor_asprintf(&pattern, "%s\\*", dirname);
3373 #ifdef UNICODE
3374   mbstowcs(tpattern,pattern,MAX_PATH);
3375 #else
3376   strlcpy(tpattern, pattern, MAX_PATH);
3377 #endif
3378   if (INVALID_HANDLE_VALUE == (handle = FindFirstFile(tpattern, &findData))) {
3379     tor_free(pattern);
3380     return NULL;
3381   }
3382   result = smartlist_new();
3383   while (1) {
3384 #ifdef UNICODE
3385     wcstombs(name,findData.cFileName,MAX_PATH);
3386     name[sizeof(name)-1] = '\0';
3387 #else
3388     strlcpy(name,findData.cFileName,sizeof(name));
3389 #endif
3390     if (strcmp(name, ".") &&
3391         strcmp(name, "..")) {
3392       smartlist_add(result, tor_strdup(name));
3393     }
3394     if (!FindNextFile(handle, &findData)) {
3395       DWORD err;
3396       if ((err = GetLastError()) != ERROR_NO_MORE_FILES) {
3397         char *errstr = format_win32_error(err);
3398         log_warn(LD_FS, "Error reading directory '%s': %s", dirname, errstr);
3399         tor_free(errstr);
3400       }
3401       break;
3402     }
3403   }
3404   FindClose(handle);
3405   tor_free(pattern);
3406 #else
3407   const char *prot_dname = sandbox_intern_string(dirname);
3408   DIR *d;
3409   struct dirent *de;
3410   if (!(d = opendir(prot_dname)))
3411     return NULL;
3412
3413   result = smartlist_new();
3414   while ((de = readdir(d))) {
3415     if (!strcmp(de->d_name, ".") ||
3416         !strcmp(de->d_name, ".."))
3417       continue;
3418     smartlist_add(result, tor_strdup(de->d_name));
3419   }
3420   closedir(d);
3421 #endif
3422   return result;
3423 }
3424
3425 /** Return true iff <b>filename</b> is a relative path. */
3426 int
3427 path_is_relative(const char *filename)
3428 {
3429   if (filename && filename[0] == '/')
3430     return 0;
3431 #ifdef _WIN32
3432   else if (filename && filename[0] == '\\')
3433     return 0;
3434   else if (filename && strlen(filename)>3 && TOR_ISALPHA(filename[0]) &&
3435            filename[1] == ':' && filename[2] == '\\')
3436     return 0;
3437 #endif
3438   else
3439     return 1;
3440 }
3441
3442 /* =====
3443  * Process helpers
3444  * ===== */
3445
3446 #ifndef _WIN32
3447 /* Based on code contributed by christian grothoff */
3448 /** True iff we've called start_daemon(). */
3449 static int start_daemon_called = 0;
3450 /** True iff we've called finish_daemon(). */
3451 static int finish_daemon_called = 0;
3452 /** Socketpair used to communicate between parent and child process while
3453  * daemonizing. */
3454 static int daemon_filedes[2];
3455 /** Start putting the process into daemon mode: fork and drop all resources
3456  * except standard fds.  The parent process never returns, but stays around
3457  * until finish_daemon is called.  (Note: it's safe to call this more
3458  * than once: calls after the first are ignored.)
3459  */
3460 void
3461 start_daemon(void)
3462 {
3463   pid_t pid;
3464
3465   if (start_daemon_called)
3466     return;
3467   start_daemon_called = 1;
3468
3469   if (pipe(daemon_filedes)) {
3470     log_err(LD_GENERAL,"pipe failed; exiting. Error was %s", strerror(errno));
3471     exit(1);
3472   }
3473   pid = fork();
3474   if (pid < 0) {
3475     log_err(LD_GENERAL,"fork failed. Exiting.");
3476     exit(1);
3477   }
3478   if (pid) {  /* Parent */
3479     int ok;
3480     char c;
3481
3482     close(daemon_filedes[1]); /* we only read */
3483     ok = -1;
3484     while (0 < read(daemon_filedes[0], &c, sizeof(char))) {
3485       if (c == '.')
3486         ok = 1;
3487     }
3488     fflush(stdout);
3489     if (ok == 1)
3490       exit(0);
3491     else
3492       exit(1); /* child reported error */
3493   } else { /* Child */
3494     close(daemon_filedes[0]); /* we only write */
3495
3496     pid = setsid(); /* Detach from controlling terminal */
3497     /*
3498      * Fork one more time, so the parent (the session group leader) can exit.
3499      * This means that we, as a non-session group leader, can never regain a
3500      * controlling terminal.   This part is recommended by Stevens's
3501      * _Advanced Programming in the Unix Environment_.
3502      */
3503     if (fork() != 0) {
3504       exit(0);
3505     }
3506     set_main_thread(); /* We are now the main thread. */
3507
3508     return;
3509   }
3510 }
3511
3512 /** Finish putting the process into daemon mode: drop standard fds, and tell
3513  * the parent process to exit.  (Note: it's safe to call this more than once:
3514  * calls after the first are ignored.  Calls start_daemon first if it hasn't
3515  * been called already.)
3516  */
3517 void
3518 finish_daemon(const char *desired_cwd)
3519 {
3520   int nullfd;
3521   char c = '.';
3522   if (finish_daemon_called)
3523     return;
3524   if (!start_daemon_called)
3525     start_daemon();
3526   finish_daemon_called = 1;
3527
3528   if (!desired_cwd)
3529     desired_cwd = "/";
3530    /* Don't hold the wrong FS mounted */
3531   if (chdir(desired_cwd) < 0) {
3532     log_err(LD_GENERAL,"chdir to \"%s\" failed. Exiting.",desired_cwd);
3533     exit(1);
3534   }
3535
3536   nullfd = tor_open_cloexec("/dev/null", O_RDWR, 0);
3537   if (nullfd < 0) {
3538     log_err(LD_GENERAL,"/dev/null can't be opened. Exiting.");
3539     exit(1);
3540   }
3541   /* close fds linking to invoking terminal, but
3542    * close usual incoming fds, but redirect them somewhere
3543    * useful so the fds don't get reallocated elsewhere.
3544    */
3545   if (dup2(nullfd,0) < 0 ||
3546       dup2(nullfd,1) < 0 ||
3547       dup2(nullfd,2) < 0) {
3548     log_err(LD_GENERAL,"dup2 failed. Exiting.");
3549     exit(1);
3550   }
3551   if (nullfd > 2)
3552     close(nullfd);
3553   /* signal success */
3554   if (write(daemon_filedes[1], &c, sizeof(char)) != sizeof(char)) {
3555     log_err(LD_GENERAL,"write failed. Exiting.");
3556   }
3557   close(daemon_filedes[1]);
3558 }
3559 #else
3560 /* defined(_WIN32) */
3561 void
3562 start_daemon(void)
3563 {
3564 }
3565 void
3566 finish_daemon(const char *cp)
3567 {
3568   (void)cp;
3569 }
3570 #endif
3571
3572 /** Write the current process ID, followed by NL, into <b>filename</b>.
3573  */
3574 void
3575 write_pidfile(char *filename)
3576 {
3577   FILE *pidfile;
3578
3579   if ((pidfile = fopen(filename, "w")) == NULL) {
3580     log_warn(LD_FS, "Unable to open \"%s\" for writing: %s", filename,
3581              strerror(errno));
3582   } else {
3583 #ifdef _WIN32
3584     fprintf(pidfile, "%d\n", (int)_getpid());
3585 #else
3586     fprintf(pidfile, "%d\n", (int)getpid());
3587 #endif
3588     fclose(pidfile);
3589   }
3590 }
3591
3592 #ifdef _WIN32
3593 HANDLE
3594 load_windows_system_library(const TCHAR *library_name)
3595 {
3596   TCHAR path[MAX_PATH];
3597   unsigned n;
3598   n = GetSystemDirectory(path, MAX_PATH);
3599   if (n == 0 || n + _tcslen(library_name) + 2 >= MAX_PATH)
3600     return 0;
3601   _tcscat(path, TEXT("\\"));
3602   _tcscat(path, library_name);
3603   return LoadLibrary(path);
3604 }
3605 #endif
3606
3607 /** Format a single argument for being put on a Windows command line.
3608  * Returns a newly allocated string */
3609 static char *
3610 format_win_cmdline_argument(const char *arg)
3611 {
3612   char *formatted_arg;
3613   char need_quotes;
3614   const char *c;
3615   int i;
3616   int bs_counter = 0;
3617   /* Backslash we can point to when one is inserted into the string */
3618   const char backslash = '\\';
3619
3620   /* Smartlist of *char */
3621   smartlist_t *arg_chars;
3622   arg_chars = smartlist_new();
3623
3624   /* Quote string if it contains whitespace or is empty */
3625   need_quotes = (strchr(arg, ' ') || strchr(arg, '\t') || '\0' == arg[0]);
3626
3627   /* Build up smartlist of *chars */
3628   for (c=arg; *c != '\0'; c++) {
3629     if ('"' == *c) {
3630       /* Double up backslashes preceding a quote */
3631       for (i=0; i<(bs_counter*2); i++)
3632         smartlist_add(arg_chars, (void*)&backslash);
3633       bs_counter = 0;
3634       /* Escape the quote */
3635       smartlist_add(arg_chars, (void*)&backslash);
3636       smartlist_add(arg_chars, (void*)c);
3637     } else if ('\\' == *c) {
3638       /* Count backslashes until we know whether to double up */
3639       bs_counter++;
3640     } else {
3641       /* Don't double up slashes preceding a non-quote */
3642       for (i=0; i<bs_counter; i++)
3643         smartlist_add(arg_chars, (void*)&backslash);
3644       bs_counter = 0;
3645       smartlist_add(arg_chars, (void*)c);
3646     }
3647   }
3648   /* Don't double up trailing backslashes */
3649   for (i=0; i<bs_counter; i++)
3650     smartlist_add(arg_chars, (void*)&backslash);
3651
3652   /* Allocate space for argument, quotes (if needed), and terminator */
3653   const size_t formatted_arg_len = smartlist_len(arg_chars) +
3654     (need_quotes ? 2 : 0) + 1;
3655   formatted_arg = tor_malloc_zero(formatted_arg_len);
3656
3657   /* Add leading quote */
3658   i=0;
3659   if (need_quotes)
3660     formatted_arg[i++] = '"';
3661
3662   /* Add characters */
3663   SMARTLIST_FOREACH(arg_chars, char*, c,
3664   {
3665     formatted_arg[i++] = *c;
3666   });
3667
3668   /* Add trailing quote */
3669   if (need_quotes)
3670     formatted_arg[i++] = '"';
3671   formatted_arg[i] = '\0';
3672
3673   smartlist_free(arg_chars);
3674   return formatted_arg;
3675 }
3676
3677 /** Format a command line for use on Windows, which takes the command as a
3678  * string rather than string array. Follows the rules from "Parsing C++
3679  * Command-Line Arguments" in MSDN. Algorithm based on list2cmdline in the
3680  * Python subprocess module. Returns a newly allocated string */
3681 char *
3682 tor_join_win_cmdline(const char *argv[])
3683 {
3684   smartlist_t *argv_list;
3685   char *joined_argv;
3686   int i;
3687
3688   /* Format each argument and put the result in a smartlist */
3689   argv_list = smartlist_new();
3690   for (i=0; argv[i] != NULL; i++) {
3691     smartlist_add(argv_list, (void *)format_win_cmdline_argument(argv[i]));
3692   }
3693
3694   /* Join the arguments with whitespace */
3695   joined_argv = smartlist_join_strings(argv_list, " ", 0, NULL);
3696
3697   /* Free the newly allocated arguments, and the smartlist */
3698   SMARTLIST_FOREACH(argv_list, char *, arg,
3699   {
3700     tor_free(arg);
3701   });
3702   smartlist_free(argv_list);
3703
3704   return joined_argv;
3705 }
3706
3707 /* As format_{hex,dex}_number_sigsafe, but takes a <b>radix</b> argument
3708  * in range 2..16 inclusive. */
3709 static int
3710 format_number_sigsafe(unsigned long x, char *buf, int buf_len,
3711                       unsigned int radix)
3712 {
3713   unsigned long tmp;
3714   int len;
3715   char *cp;
3716
3717   /* NOT tor_assert. This needs to be safe to run from within a signal handler,
3718    * and from within the 'tor_assert() has failed' code. */
3719   if (radix < 2 || radix > 16)
3720     return 0;
3721
3722   /* Count how many digits we need. */
3723   tmp = x;
3724   len = 1;
3725   while (tmp >= radix) {
3726     tmp /= radix;
3727     ++len;
3728   }
3729
3730   /* Not long enough */
3731   if (!buf || len >= buf_len)
3732     return 0;
3733
3734   cp = buf + len;
3735   *cp = '\0';
3736   do {
3737     unsigned digit = (unsigned) (x % radix);
3738     tor_assert(cp > buf);
3739     --cp;
3740     *cp = "0123456789ABCDEF"[digit];
3741     x /= radix;
3742   } while (x);
3743
3744   /* NOT tor_assert; see above. */
3745   if (cp != buf) {
3746     abort();
3747   }
3748
3749   return len;
3750 }
3751
3752 /**
3753  * Helper function to output hex numbers from within a signal handler.
3754  *
3755  * Writes the nul-terminated hexadecimal digits of <b>x</b> into a buffer
3756  * <b>buf</b> of size <b>buf_len</b>, and return the actual number of digits
3757  * written, not counting the terminal NUL.
3758  *
3759  * If there is insufficient space, write nothing and return 0.
3760  *
3761  * This accepts an unsigned int because format_helper_exit_status() needs to
3762  * call it with a signed int and an unsigned char, and since the C standard
3763  * does not guarantee that an int is wider than a char (an int must be at
3764  * least 16 bits but it is permitted for a char to be that wide as well), we
3765  * can't assume a signed int is sufficient to accomodate an unsigned char.
3766  * Thus, format_helper_exit_status() will still need to emit any require '-'
3767  * on its own.
3768  *
3769  * For most purposes, you'd want to use tor_snprintf("%x") instead of this
3770  * function; it's designed to be used in code paths where you can't call
3771  * arbitrary C functions.
3772  */
3773 int
3774 format_hex_number_sigsafe(unsigned long x, char *buf, int buf_len)
3775 {
3776   return format_number_sigsafe(x, buf, buf_len, 16);
3777 }
3778
3779 /** As format_hex_number_sigsafe, but format the number in base 10. */
3780 int
3781 format_dec_number_sigsafe(unsigned long x, char *buf, int buf_len)
3782 {
3783   return format_number_sigsafe(x, buf, buf_len, 10);
3784 }
3785
3786 #ifndef _WIN32
3787 /** Format <b>child_state</b> and <b>saved_errno</b> as a hex string placed in
3788  * <b>hex_errno</b>.  Called between fork and _exit, so must be signal-handler
3789  * safe.
3790  *
3791  * <b>hex_errno</b> must have at least HEX_ERRNO_SIZE+1 bytes available.
3792  *
3793  * The format of <b>hex_errno</b> is: "CHILD_STATE/ERRNO\n", left-padded
3794  * with spaces. CHILD_STATE indicates where
3795  * in the processs of starting the child process did the failure occur (see
3796  * CHILD_STATE_* macros for definition), and SAVED_ERRNO is the value of
3797  * errno when the failure occurred.
3798  *
3799  * On success return the number of characters added to hex_errno, not counting
3800  * the terminating NUL; return -1 on error.
3801  */
3802 STATIC int
3803 format_helper_exit_status(unsigned char child_state, int saved_errno,
3804                           char *hex_errno)
3805 {
3806   unsigned int unsigned_errno;
3807   int written, left;
3808   char *cur;
3809   size_t i;
3810   int res = -1;
3811
3812   /* Fill hex_errno with spaces, and a trailing newline (memset may
3813      not be signal handler safe, so we can't use it) */
3814   for (i = 0; i < (HEX_ERRNO_SIZE - 1); i++)
3815     hex_errno[i] = ' ';
3816   hex_errno[HEX_ERRNO_SIZE - 1] = '\n';
3817
3818   /* Convert errno to be unsigned for hex conversion */
3819   if (saved_errno < 0) {
3820     // Avoid overflow on the cast to unsigned int when result is INT_MIN
3821     // by adding 1 to the signed int negative value,
3822     // then, after it has been negated and cast to unsigned,
3823     // adding the original 1 back (the double-addition is intentional).
3824     // Otherwise, the cast to signed could cause a temporary int
3825     // to equal INT_MAX + 1, which is undefined.
3826     unsigned_errno = ((unsigned int) -(saved_errno + 1)) + 1;
3827   } else {
3828     unsigned_errno = (unsigned int) saved_errno;
3829   }
3830
3831   /*
3832    * Count how many chars of space we have left, and keep a pointer into the
3833    * current point in the buffer.
3834    */
3835   left = HEX_ERRNO_SIZE+1;
3836   cur = hex_errno;
3837
3838   /* Emit child_state */
3839   written = format_hex_number_sigsafe(child_state, cur, left);
3840
3841   if (written <= 0)
3842     goto err;
3843
3844   /* Adjust left and cur */
3845   left -= written;
3846   cur += written;
3847   if (left <= 0)
3848     goto err;
3849
3850   /* Now the '/' */
3851   *cur = '/';
3852
3853   /* Adjust left and cur */
3854   ++cur;
3855   --left;
3856   if (left <= 0)
3857     goto err;
3858
3859   /* Need minus? */
3860   if (saved_errno < 0) {
3861     *cur = '-';
3862     ++cur;
3863     --left;
3864     if (left <= 0)
3865       goto err;
3866   }
3867
3868   /* Emit unsigned_errno */
3869   written = format_hex_number_sigsafe(unsigned_errno, cur, left);
3870
3871   if (written <= 0)
3872     goto err;
3873
3874   /* Adjust left and cur */
3875   left -= written;
3876   cur += written;
3877
3878   /* Check that we have enough space left for a newline and a NUL */
3879   if (left <= 1)
3880     goto err;
3881
3882   /* Emit the newline and NUL */
3883   *cur++ = '\n';
3884   *cur++ = '\0';
3885
3886   res = (int)(cur - hex_errno - 1);
3887
3888   goto done;
3889
3890  err:
3891   /*
3892    * In error exit, just write a '\0' in the first char so whatever called
3893    * this at least won't fall off the end.
3894    */
3895   *hex_errno = '\0';
3896
3897  done:
3898   return res;
3899 }
3900 #endif
3901
3902 /* Maximum number of file descriptors, if we cannot get it via sysconf() */
3903 #define DEFAULT_MAX_FD 256
3904
3905 /** Terminate the process of <b>process_handle</b>.
3906  *  Code borrowed from Python's os.kill. */
3907 int
3908 tor_terminate_process(process_handle_t *process_handle)
3909 {
3910 #ifdef _WIN32
3911   if (tor_get_exit_code(process_handle, 0, NULL) == PROCESS_EXIT_RUNNING) {
3912     HANDLE handle = process_handle->pid.hProcess;
3913
3914     if (!TerminateProcess(handle, 0))
3915       return -1;
3916     else
3917       return 0;
3918   }
3919 #else /* Unix */
3920   if (process_handle->waitpid_cb) {
3921     /* We haven't got a waitpid yet, so we can just kill off the process. */
3922     return kill(process_handle->pid, SIGTERM);
3923   }
3924 #endif
3925
3926   return -1;
3927 }
3928
3929 /** Return the Process ID of <b>process_handle</b>. */
3930 int
3931 tor_process_get_pid(process_handle_t *process_handle)
3932 {
3933 #ifdef _WIN32
3934   return (int) process_handle->pid.dwProcessId;
3935 #else
3936   return (int) process_handle->pid;
3937 #endif
3938 }
3939
3940 #ifdef _WIN32
3941 HANDLE
3942 tor_process_get_stdout_pipe(process_handle_t *process_handle)
3943 {
3944   return process_handle->stdout_pipe;
3945 }
3946 #else
3947 /* DOCDOC tor_process_get_stdout_pipe */
3948 FILE *
3949 tor_process_get_stdout_pipe(process_handle_t *process_handle)
3950 {
3951   return process_handle->stdout_handle;
3952 }
3953 #endif
3954
3955 /* DOCDOC process_handle_new */
3956 static process_handle_t *
3957 process_handle_new(void)
3958 {
3959   process_handle_t *out = tor_malloc_zero(sizeof(process_handle_t));
3960
3961 #ifdef _WIN32
3962   out->stdin_pipe = INVALID_HANDLE_VALUE;
3963   out->stdout_pipe = INVALID_HANDLE_VALUE;
3964   out->stderr_pipe = INVALID_HANDLE_VALUE;
3965 #else
3966   out->stdin_pipe = -1;
3967   out->stdout_pipe = -1;
3968   out->stderr_pipe = -1;
3969 #endif
3970
3971   return out;
3972 }
3973
3974 #ifndef _WIN32
3975 /** Invoked when a process that we've launched via tor_spawn_background() has
3976  * been found to have terminated.
3977  */
3978 static void
3979 process_handle_waitpid_cb(int status, void *arg)
3980 {
3981   process_handle_t *process_handle = arg;
3982
3983   process_handle->waitpid_exit_status = status;
3984   clear_waitpid_callback(process_handle->waitpid_cb);
3985   if (process_handle->status == PROCESS_STATUS_RUNNING)
3986     process_handle->status = PROCESS_STATUS_NOTRUNNING;
3987   process_handle->waitpid_cb = 0;
3988 }
3989 #endif
3990
3991 /**
3992  * @name child-process states
3993  *
3994  * Each of these values represents a possible state that a child process can
3995  * be in.  They're used to determine what to say when telling the parent how
3996  * far along we were before failure.
3997  *
3998  * @{
3999  */
4000 #define CHILD_STATE_INIT 0
4001 #define CHILD_STATE_PIPE 1
4002 #define CHILD_STATE_MAXFD 2
4003 #define CHILD_STATE_FORK 3
4004 #define CHILD_STATE_DUPOUT 4
4005 #define CHILD_STATE_DUPERR 5
4006 #define CHILD_STATE_DUPIN 6
4007 #define CHILD_STATE_CLOSEFD 7
4008 #define CHILD_STATE_EXEC 8
4009 #define CHILD_STATE_FAILEXEC 9
4010 /** @} */
4011 /** Start a program in the background. If <b>filename</b> contains a '/', then
4012  * it will be treated as an absolute or relative path.  Otherwise, on
4013  * non-Windows systems, the system path will be searched for <b>filename</b>.
4014  * On Windows, only the current directory will be searched. Here, to search the
4015  * system path (as well as the application directory, current working
4016  * directory, and system directories), set filename to NULL.
4017  *
4018  * The strings in <b>argv</b> will be passed as the command line arguments of
4019  * the child program (following convention, argv[0] should normally be the
4020  * filename of the executable, and this must be the case if <b>filename</b> is
4021  * NULL). The last element of argv must be NULL. A handle to the child process
4022  * will be returned in process_handle (which must be non-NULL). Read
4023  * process_handle.status to find out if the process was successfully launched.
4024  * For convenience, process_handle.status is returned by this function.
4025  *
4026  * Some parts of this code are based on the POSIX subprocess module from
4027  * Python, and example code from
4028  * http://msdn.microsoft.com/en-us/library/ms682499%28v=vs.85%29.aspx.
4029  */
4030 int
4031 tor_spawn_background(const char *const filename, const char **argv,
4032                      process_environment_t *env,
4033                      process_handle_t **process_handle_out)
4034 {
4035 #ifdef _WIN32
4036   HANDLE stdout_pipe_read = NULL;
4037   HANDLE stdout_pipe_write = NULL;
4038   HANDLE stderr_pipe_read = NULL;
4039   HANDLE stderr_pipe_write = NULL;
4040   HANDLE stdin_pipe_read = NULL;
4041   HANDLE stdin_pipe_write = NULL;
4042   process_handle_t *process_handle;
4043   int status;
4044
4045   STARTUPINFOA siStartInfo;
4046   BOOL retval = FALSE;
4047
4048   SECURITY_ATTRIBUTES saAttr;
4049   char *joined_argv;
4050
4051   saAttr.nLength = sizeof(SECURITY_ATTRIBUTES);
4052   saAttr.bInheritHandle = TRUE;
4053   /* TODO: should we set explicit security attributes? (#2046, comment 5) */
4054   saAttr.lpSecurityDescriptor = NULL;
4055
4056   /* Assume failure to start process */
4057   status = PROCESS_STATUS_ERROR;
4058
4059   /* Set up pipe for stdout */
4060   if (!CreatePipe(&stdout_pipe_read, &stdout_pipe_write, &saAttr, 0)) {
4061     log_warn(LD_GENERAL,
4062       "Failed to create pipe for stdout communication with child process: %s",
4063       format_win32_error(GetLastError()));
4064     return status;
4065   }
4066   if (!SetHandleInformation(stdout_pipe_read, HANDLE_FLAG_INHERIT, 0)) {
4067     log_warn(LD_GENERAL,
4068       "Failed to configure pipe for stdout communication with child "
4069       "process: %s", format_win32_error(GetLastError()));
4070     return status;
4071   }
4072
4073   /* Set up pipe for stderr */
4074   if (!CreatePipe(&stderr_pipe_read, &stderr_pipe_write, &saAttr, 0)) {
4075     log_warn(LD_GENERAL,
4076       "Failed to create pipe for stderr communication with child process: %s",
4077       format_win32_error(GetLastError()));
4078     return status;
4079   }
4080   if (!SetHandleInformation(stderr_pipe_read, HANDLE_FLAG_INHERIT, 0)) {
4081     log_warn(LD_GENERAL,
4082       "Failed to configure pipe for stderr communication with child "
4083       "process: %s", format_win32_error(GetLastError()));
4084     return status;
4085   }
4086
4087   /* Set up pipe for stdin */
4088   if (!CreatePipe(&stdin_pipe_read, &stdin_pipe_write, &saAttr, 0)) {
4089     log_warn(LD_GENERAL,
4090       "Failed to create pipe for stdin communication with child process: %s",
4091       format_win32_error(GetLastError()));
4092     return status;
4093   }
4094   if (!SetHandleInformation(stdin_pipe_write, HANDLE_FLAG_INHERIT, 0)) {
4095     log_warn(LD_GENERAL,
4096       "Failed to configure pipe for stdin communication with child "
4097       "process: %s", format_win32_error(GetLastError()));
4098     return status;
4099   }
4100
4101   /* Create the child process */
4102
4103   /* Windows expects argv to be a whitespace delimited string, so join argv up
4104    */
4105   joined_argv = tor_join_win_cmdline(argv);
4106
4107   process_handle = process_handle_new();
4108   process_handle->status = status;
4109
4110   ZeroMemory(&(process_handle->pid), sizeof(PROCESS_INFORMATION));
4111   ZeroMemory(&siStartInfo, sizeof(STARTUPINFO));
4112   siStartInfo.cb = sizeof(STARTUPINFO);
4113   siStartInfo.hStdError = stderr_pipe_write;
4114   siStartInfo.hStdOutput = stdout_pipe_write;
4115   siStartInfo.hStdInput = stdin_pipe_read;
4116   siStartInfo.dwFlags |= STARTF_USESTDHANDLES;
4117
4118   /* Create the child process */
4119
4120   retval = CreateProcessA(filename,      // module name
4121                  joined_argv,   // command line
4122   /* TODO: should we set explicit security attributes? (#2046, comment 5) */
4123                  NULL,          // process security attributes
4124                  NULL,          // primary thread security attributes
4125                  TRUE,          // handles are inherited
4126   /*(TODO: set CREATE_NEW CONSOLE/PROCESS_GROUP to make GetExitCodeProcess()
4127    * work?) */
4128                  CREATE_NO_WINDOW,             // creation flags
4129                  (env==NULL) ? NULL : env->windows_environment_block,
4130                  NULL,          // use parent's current directory
4131                  &siStartInfo,  // STARTUPINFO pointer
4132                  &(process_handle->pid));  // receives PROCESS_INFORMATION
4133
4134   tor_free(joined_argv);
4135
4136   if (!retval) {
4137     log_warn(LD_GENERAL,
4138       "Failed to create child process %s: %s", filename?filename:argv[0],
4139       format_win32_error(GetLastError()));
4140     tor_free(process_handle);
4141   } else  {
4142     /* TODO: Close hProcess and hThread in process_handle->pid? */
4143     process_handle->stdout_pipe = stdout_pipe_read;
4144     process_handle->stderr_pipe = stderr_pipe_read;
4145     process_handle->stdin_pipe = stdin_pipe_write;
4146     status = process_handle->status = PROCESS_STATUS_RUNNING;
4147   }
4148
4149   /* TODO: Close pipes on exit */
4150   *process_handle_out = process_handle;
4151   return status;
4152 #else // _WIN32
4153   pid_t pid;
4154   int stdout_pipe[2];
4155   int stderr_pipe[2];
4156   int stdin_pipe[2];
4157   int fd, retval;
4158   ssize_t nbytes;
4159   process_handle_t *process_handle;
4160   int status;
4161
4162   const char *error_message = SPAWN_ERROR_MESSAGE;
4163   size_t error_message_length;
4164
4165   /* Represents where in the process of spawning the program is;
4166      this is used for printing out the error message */
4167   unsigned char child_state = CHILD_STATE_INIT;
4168
4169   char hex_errno[HEX_ERRNO_SIZE + 2]; /* + 1 should be sufficient actually */
4170
4171   static int max_fd = -1;
4172
4173   status = PROCESS_STATUS_ERROR;
4174
4175   /* We do the strlen here because strlen() is not signal handler safe,
4176      and we are not allowed to use unsafe functions between fork and exec */
4177   error_message_length = strlen(error_message);
4178
4179   child_state = CHILD_STATE_PIPE;
4180
4181   /* Set up pipe for redirecting stdout, stderr, and stdin of child */
4182   retval = pipe(stdout_pipe);
4183   if (-1 == retval) {
4184     log_warn(LD_GENERAL,
4185       "Failed to set up pipe for stdout communication with child process: %s",
4186        strerror(errno));
4187     return status;
4188   }
4189
4190   retval = pipe(stderr_pipe);
4191   if (-1 == retval) {
4192     log_warn(LD_GENERAL,
4193       "Failed to set up pipe for stderr communication with child process: %s",
4194       strerror(errno));
4195
4196     close(stdout_pipe[0]);
4197     close(stdout_pipe[1]);
4198
4199     return status;
4200   }
4201
4202   retval = pipe(stdin_pipe);
4203   if (-1 == retval) {
4204     log_warn(LD_GENERAL,
4205       "Failed to set up pipe for stdin communication with child process: %s",
4206        strerror(errno));
4207
4208     close(stdout_pipe[0]);
4209     close(stdout_pipe[1]);
4210     close(stderr_pipe[0]);
4211     close(stderr_pipe[1]);
4212
4213     return status;
4214   }
4215
4216   child_state = CHILD_STATE_MAXFD;
4217
4218 #ifdef _SC_OPEN_MAX
4219   if (-1 == max_fd) {
4220     max_fd = (int) sysconf(_SC_OPEN_MAX);
4221     if (max_fd == -1) {
4222       max_fd = DEFAULT_MAX_FD;
4223       log_warn(LD_GENERAL,
4224                "Cannot find maximum file descriptor, assuming %d", max_fd);
4225     }
4226   }
4227 #else
4228   max_fd = DEFAULT_MAX_FD;
4229 #endif
4230
4231   child_state = CHILD_STATE_FORK;
4232
4233   pid = fork();
4234   if (0 == pid) {
4235     /* In child */
4236
4237 #if defined(HAVE_SYS_PRCTL_H) && defined(__linux__)
4238     /* Attempt to have the kernel issue a SIGTERM if the parent
4239      * goes away. Certain attributes of the binary being execve()ed
4240      * will clear this during the execve() call, but it's better
4241      * than nothing.
4242      */
4243     prctl(PR_SET_PDEATHSIG, SIGTERM);
4244 #endif
4245
4246     child_state = CHILD_STATE_DUPOUT;
4247
4248     /* Link child stdout to the write end of the pipe */
4249     retval = dup2(stdout_pipe[1], STDOUT_FILENO);
4250     if (-1 == retval)
4251         goto error;
4252
4253     child_state = CHILD_STATE_DUPERR;
4254
4255     /* Link child stderr to the write end of the pipe */
4256     retval = dup2(stderr_pipe[1], STDERR_FILENO);
4257     if (-1 == retval)
4258         goto error;
4259
4260     child_state = CHILD_STATE_DUPIN;
4261
4262     /* Link child stdin to the read end of the pipe */
4263     retval = dup2(stdin_pipe[0], STDIN_FILENO);
4264     if (-1 == retval)
4265       goto error;
4266
4267     child_state = CHILD_STATE_CLOSEFD;
4268
4269     close(stderr_pipe[0]);
4270     close(stderr_pipe[1]);
4271     close(stdout_pipe[0]);
4272     close(stdout_pipe[1]);
4273     close(stdin_pipe[0]);
4274     close(stdin_pipe[1]);
4275
4276     /* Close all other fds, including the read end of the pipe */
4277     /* XXX: We should now be doing enough FD_CLOEXEC setting to make
4278      * this needless. */
4279     for (fd = STDERR_FILENO + 1; fd < max_fd; fd++) {
4280       close(fd);
4281     }
4282
4283     child_state = CHILD_STATE_EXEC;
4284
4285     /* Call the requested program. We need the cast because
4286        execvp doesn't define argv as const, even though it
4287        does not modify the arguments */
4288     if (env)
4289       execve(filename, (char *const *) argv, env->unixoid_environment_block);
4290     else {
4291       static char *new_env[] = { NULL };
4292       execve(filename, (char *const *) argv, new_env);
4293     }
4294
4295     /* If we got here, the exec or open(/dev/null) failed */
4296
4297     child_state = CHILD_STATE_FAILEXEC;
4298
4299   error:
4300     {
4301       /* XXX: are we leaking fds from the pipe? */
4302       int n;
4303
4304       n = format_helper_exit_status(child_state, errno, hex_errno);
4305
4306       if (n >= 0) {
4307         /* Write the error message. GCC requires that we check the return
4308            value, but there is nothing we can do if it fails */
4309         /* TODO: Don't use STDOUT, use a pipe set up just for this purpose */
4310         nbytes = write(STDOUT_FILENO, error_message, error_message_length);
4311         nbytes = write(STDOUT_FILENO, hex_errno, n);
4312       }
4313     }
4314
4315     (void) nbytes;
4316
4317     _exit(255);
4318     /* Never reached, but avoids compiler warning */
4319     return status;
4320   }
4321
4322   /* In parent */
4323
4324   if (-1 == pid) {
4325     log_warn(LD_GENERAL, "Failed to fork child process: %s", strerror(errno));
4326     close(stdin_pipe[0]);
4327     close(stdin_pipe[1]);
4328     close(stdout_pipe[0]);
4329     close(stdout_pipe[1]);
4330     close(stderr_pipe[0]);
4331     close(stderr_pipe[1]);
4332     return status;
4333   }
4334
4335   process_handle = process_handle_new();
4336   process_handle->status = status;
4337   process_handle->pid = pid;
4338
4339   /* TODO: If the child process forked but failed to exec, waitpid it */
4340
4341   /* Return read end of the pipes to caller, and close write end */
4342   process_handle->stdout_pipe = stdout_pipe[0];
4343   retval = close(stdout_pipe[1]);
4344
4345   if (-1 == retval) {
4346     log_warn(LD_GENERAL,
4347             "Failed to close write end of stdout pipe in parent process: %s",
4348             strerror(errno));
4349   }
4350
4351   process_handle->waitpid_cb = set_waitpid_callback(pid,
4352                                                     process_handle_waitpid_cb,
4353                                                     process_handle);
4354
4355   process_handle->stderr_pipe = stderr_pipe[0];
4356   retval = close(stderr_pipe[1]);
4357
4358   if (-1 == retval) {
4359     log_warn(LD_GENERAL,
4360             "Failed to close write end of stderr pipe in parent process: %s",
4361             strerror(errno));
4362   }
4363
4364   /* Return write end of the stdin pipe to caller, and close the read end */
4365   process_handle->stdin_pipe = stdin_pipe[1];
4366   retval = close(stdin_pipe[0]);
4367
4368   if (-1 == retval) {
4369     log_warn(LD_GENERAL,
4370             "Failed to close read end of stdin pipe in parent process: %s",
4371             strerror(errno));
4372   }
4373
4374   status = process_handle->status = PROCESS_STATUS_RUNNING;
4375   /* Set stdin/stdout/stderr pipes to be non-blocking */
4376   if (fcntl(process_handle->stdout_pipe, F_SETFL, O_NONBLOCK) < 0 ||
4377       fcntl(process_handle->stderr_pipe, F_SETFL, O_NONBLOCK) < 0 ||
4378       fcntl(process_handle->stdin_pipe, F_SETFL, O_NONBLOCK) < 0) {
4379     log_warn(LD_GENERAL, "Failed to set stderror/stdout/stdin pipes "
4380              "nonblocking in parent process: %s", strerror(errno));
4381   }
4382   /* Open the buffered IO streams */
4383   process_handle->stdout_handle = fdopen(process_handle->stdout_pipe, "r");
4384   process_handle->stderr_handle = fdopen(process_handle->stderr_pipe, "r");
4385   process_handle->stdin_handle = fdopen(process_handle->stdin_pipe, "r");
4386
4387   *process_handle_out = process_handle;
4388   return process_handle->status;
4389 #endif // _WIN32
4390 }
4391
4392 /** Destroy all resources allocated by the process handle in
4393  *  <b>process_handle</b>.
4394  *  If <b>also_terminate_process</b> is true, also terminate the
4395  *  process of the process handle. */
4396 MOCK_IMPL(void,
4397 tor_process_handle_destroy,(process_handle_t *process_handle,
4398                             int also_terminate_process))
4399 {
4400   if (!process_handle)
4401     return;
4402
4403   if (also_terminate_process) {
4404     if (tor_terminate_process(process_handle) < 0) {
4405       const char *errstr =
4406 #ifdef _WIN32
4407         format_win32_error(GetLastError());
4408 #else
4409         strerror(errno);
4410 #endif
4411       log_notice(LD_GENERAL, "Failed to terminate process with "
4412                  "PID '%d' ('%s').", tor_process_get_pid(process_handle),
4413                  errstr);
4414     } else {
4415       log_info(LD_GENERAL, "Terminated process with PID '%d'.",
4416                tor_process_get_pid(process_handle));
4417     }
4418   }
4419
4420   process_handle->status = PROCESS_STATUS_NOTRUNNING;
4421
4422 #ifdef _WIN32
4423   if (process_handle->stdout_pipe)
4424     CloseHandle(process_handle->stdout_pipe);
4425
4426   if (process_handle->stderr_pipe)
4427     CloseHandle(process_handle->stderr_pipe);
4428
4429   if (process_handle->stdin_pipe)
4430     CloseHandle(process_handle->stdin_pipe);
4431 #else
4432   if (process_handle->stdout_handle)
4433     fclose(process_handle->stdout_handle);
4434
4435   if (process_handle->stderr_handle)
4436     fclose(process_handle->stderr_handle);
4437
4438   if (process_handle->stdin_handle)
4439     fclose(process_handle->stdin_handle);
4440
4441   clear_waitpid_callback(process_handle->waitpid_cb);
4442 #endif
4443
4444   memset(process_handle, 0x0f, sizeof(process_handle_t));
4445   tor_free(process_handle);
4446 }
4447
4448 /** Get the exit code of a process specified by <b>process_handle</b> and store
4449  * it in <b>exit_code</b>, if set to a non-NULL value.  If <b>block</b> is set
4450  * to true, the call will block until the process has exited.  Otherwise if
4451  * the process is still running, the function will return
4452  * PROCESS_EXIT_RUNNING, and exit_code will be left unchanged. Returns
4453  * PROCESS_EXIT_EXITED if the process did exit. If there is a failure,
4454  * PROCESS_EXIT_ERROR will be returned and the contents of exit_code (if
4455  * non-NULL) will be undefined. N.B. Under *nix operating systems, this will
4456  * probably not work in Tor, because waitpid() is called in main.c to reap any
4457  * terminated child processes.*/
4458 int
4459 tor_get_exit_code(process_handle_t *process_handle,
4460                   int block, int *exit_code)
4461 {
4462 #ifdef _WIN32
4463   DWORD retval;
4464   BOOL success;
4465
4466   if (block) {
4467     /* Wait for the process to exit */
4468     retval = WaitForSingleObject(process_handle->pid.hProcess, INFINITE);
4469     if (retval != WAIT_OBJECT_0) {
4470       log_warn(LD_GENERAL, "WaitForSingleObject() failed (%d): %s",
4471               (int)retval, format_win32_error(GetLastError()));
4472       return PROCESS_EXIT_ERROR;
4473     }
4474   } else {
4475     retval = WaitForSingleObject(process_handle->pid.hProcess, 0);
4476     if (WAIT_TIMEOUT == retval) {
4477       /* Process has not exited */
4478       return PROCESS_EXIT_RUNNING;
4479     } else if (retval != WAIT_OBJECT_0) {
4480       log_warn(LD_GENERAL, "WaitForSingleObject() failed (%d): %s",
4481                (int)retval, format_win32_error(GetLastError()));
4482       return PROCESS_EXIT_ERROR;
4483     }
4484   }
4485
4486   if (exit_code != NULL) {
4487     success = GetExitCodeProcess(process_handle->pid.hProcess,
4488                                  (PDWORD)exit_code);
4489     if (!success) {
4490       log_warn(LD_GENERAL, "GetExitCodeProcess() failed: %s",
4491                format_win32_error(GetLastError()));
4492       return PROCESS_EXIT_ERROR;
4493     }
4494   }
4495 #else
4496   int stat_loc;
4497   int retval;
4498
4499   if (process_handle->waitpid_cb) {
4500     /* We haven't processed a SIGCHLD yet. */
4501     retval = waitpid(process_handle->pid, &stat_loc, block?0:WNOHANG);
4502     if (retval == process_handle->pid) {
4503       clear_waitpid_callback(process_handle->waitpid_cb);
4504       process_handle->waitpid_cb = NULL;
4505       process_handle->waitpid_exit_status = stat_loc;
4506     }
4507   } else {
4508     /* We already got a SIGCHLD for this process, and handled it. */
4509     retval = process_handle->pid;
4510     stat_loc = process_handle->waitpid_exit_status;
4511   }
4512
4513   if (!block && 0 == retval) {
4514     /* Process has not exited */
4515     return PROCESS_EXIT_RUNNING;
4516   } else if (retval != process_handle->pid) {
4517     log_warn(LD_GENERAL, "waitpid() failed for PID %d: %s",
4518              process_handle->pid, strerror(errno));
4519     return PROCESS_EXIT_ERROR;
4520   }
4521
4522   if (!WIFEXITED(stat_loc)) {
4523     log_warn(LD_GENERAL, "Process %d did not exit normally",
4524              process_handle->pid);
4525     return PROCESS_EXIT_ERROR;
4526   }
4527
4528   if (exit_code != NULL)
4529     *exit_code = WEXITSTATUS(stat_loc);
4530 #endif // _WIN32
4531
4532   return PROCESS_EXIT_EXITED;
4533 }
4534
4535 /** Helper: return the number of characters in <b>s</b> preceding the first
4536  * occurrence of <b>ch</b>. If <b>ch</b> does not occur in <b>s</b>, return
4537  * the length of <b>s</b>. Should be equivalent to strspn(s, "ch"). */
4538 static INLINE size_t
4539 str_num_before(const char *s, char ch)
4540 {
4541   const char *cp = strchr(s, ch);
4542   if (cp)
4543     return cp - s;
4544   else
4545     return strlen(s);
4546 }
4547
4548 /** Return non-zero iff getenv would consider <b>s1</b> and <b>s2</b>
4549  * to have the same name as strings in a process's environment. */
4550 int
4551 environment_variable_names_equal(const char *s1, const char *s2)
4552 {
4553   size_t s1_name_len = str_num_before(s1, '=');
4554   size_t s2_name_len = str_num_before(s2, '=');
4555
4556   return (s1_name_len == s2_name_len &&
4557           tor_memeq(s1, s2, s1_name_len));
4558 }
4559
4560 /** Free <b>env</b> (assuming it was produced by
4561  * process_environment_make). */
4562 void
4563 process_environment_free(process_environment_t *env)
4564 {
4565   if (env == NULL) return;
4566
4567   /* As both an optimization hack to reduce consing on Unixoid systems
4568    * and a nice way to ensure that some otherwise-Windows-specific
4569    * code will always get tested before changes to it get merged, the
4570    * strings which env->unixoid_environment_block points to are packed
4571    * into env->windows_environment_block. */
4572   tor_free(env->unixoid_environment_block);
4573   tor_free(env->windows_environment_block);
4574
4575   tor_free(env);
4576 }
4577
4578 /** Make a process_environment_t containing the environment variables
4579  * specified in <b>env_vars</b> (as C strings of the form
4580  * "NAME=VALUE"). */
4581 process_environment_t *
4582 process_environment_make(struct smartlist_t *env_vars)
4583 {
4584   process_environment_t *env = tor_malloc_zero(sizeof(process_environment_t));
4585   size_t n_env_vars = smartlist_len(env_vars);
4586   size_t i;
4587   size_t total_env_length;
4588   smartlist_t *env_vars_sorted;
4589
4590   tor_assert(n_env_vars + 1 != 0);
4591   env->unixoid_environment_block = tor_calloc(n_env_vars + 1, sizeof(char *));
4592   /* env->unixoid_environment_block is already NULL-terminated,
4593    * because we assume that NULL == 0 (and check that during compilation). */
4594
4595   total_env_length = 1; /* terminating NUL of terminating empty string */
4596   for (i = 0; i < n_env_vars; ++i) {
4597     const char *s = smartlist_get(env_vars, i);
4598     size_t slen = strlen(s);
4599
4600     tor_assert(slen + 1 != 0);
4601     tor_assert(slen + 1 < SIZE_MAX - total_env_length);
4602     total_env_length += slen + 1;
4603   }
4604
4605   env->windows_environment_block = tor_malloc_zero(total_env_length);
4606   /* env->windows_environment_block is already
4607    * (NUL-terminated-empty-string)-terminated. */
4608
4609   /* Some versions of Windows supposedly require that environment
4610    * blocks be sorted.  Or maybe some Windows programs (or their
4611    * runtime libraries) fail to look up strings in non-sorted
4612    * environment blocks.
4613    *
4614    * Also, sorting strings makes it easy to find duplicate environment
4615    * variables and environment-variable strings without an '=' on all
4616    * OSes, and they can cause badness.  Let's complain about those. */
4617   env_vars_sorted = smartlist_new();
4618   smartlist_add_all(env_vars_sorted, env_vars);
4619   smartlist_sort_strings(env_vars_sorted);
4620
4621   /* Now copy the strings into the environment blocks. */
4622   {
4623     char *cp = env->windows_environment_block;
4624     const char *prev_env_var = NULL;
4625
4626     for (i = 0; i < n_env_vars; ++i) {
4627       const char *s = smartlist_get(env_vars_sorted, i);
4628       size_t slen = strlen(s);
4629       size_t s_name_len = str_num_before(s, '=');
4630
4631       if (s_name_len == slen) {
4632         log_warn(LD_GENERAL,
4633                  "Preparing an environment containing a variable "
4634                  "without a value: %s",
4635                  s);
4636       }
4637       if (prev_env_var != NULL &&
4638           environment_variable_names_equal(s, prev_env_var)) {
4639         log_warn(LD_GENERAL,
4640                  "Preparing an environment containing two variables "
4641                  "with the same name: %s and %s",
4642                  prev_env_var, s);
4643       }
4644
4645       prev_env_var = s;
4646
4647       /* Actually copy the string into the environment. */
4648       memcpy(cp, s, slen+1);
4649       env->unixoid_environment_block[i] = cp;
4650       cp += slen+1;
4651     }
4652
4653     tor_assert(cp == env->windows_environment_block + total_env_length - 1);
4654   }
4655
4656   smartlist_free(env_vars_sorted);
4657
4658   return env;
4659 }
4660
4661 /** Return a newly allocated smartlist containing every variable in
4662  * this process's environment, as a NUL-terminated string of the form
4663  * "NAME=VALUE".  Note that on some/many/most/all OSes, the parent
4664  * process can put strings not of that form in our environment;
4665  * callers should try to not get crashed by that.
4666  *
4667  * The returned strings are heap-allocated, and must be freed by the
4668  * caller. */
4669 struct smartlist_t *
4670 get_current_process_environment_variables(void)
4671 {
4672   smartlist_t *sl = smartlist_new();
4673
4674   char **environ_tmp; /* Not const char ** ? Really? */
4675   for (environ_tmp = get_environment(); *environ_tmp; ++environ_tmp) {
4676     smartlist_add(sl, tor_strdup(*environ_tmp));
4677   }
4678
4679   return sl;
4680 }
4681
4682 /** For each string s in <b>env_vars</b> such that
4683  * environment_variable_names_equal(s, <b>new_var</b>), remove it; if
4684  * <b>free_p</b> is non-zero, call <b>free_old</b>(s).  If
4685  * <b>new_var</b> contains '=', insert it into <b>env_vars</b>. */
4686 void
4687 set_environment_variable_in_smartlist(struct smartlist_t *env_vars,
4688                                       const char *new_var,
4689                                       void (*free_old)(void*),
4690                                       int free_p)
4691 {
4692   SMARTLIST_FOREACH_BEGIN(env_vars, const char *, s) {
4693     if (environment_variable_names_equal(s, new_var)) {
4694       SMARTLIST_DEL_CURRENT(env_vars, s);
4695       if (free_p) {
4696         free_old((void *)s);
4697       }
4698     }
4699   } SMARTLIST_FOREACH_END(s);
4700
4701   if (strchr(new_var, '=') != NULL) {
4702     smartlist_add(env_vars, (void *)new_var);
4703   }
4704 }
4705
4706 #ifdef _WIN32
4707 /** Read from a handle <b>h</b> into <b>buf</b>, up to <b>count</b> bytes.  If
4708  * <b>hProcess</b> is NULL, the function will return immediately if there is
4709  * nothing more to read. Otherwise <b>hProcess</b> should be set to the handle
4710  * to the process owning the <b>h</b>. In this case, the function will exit
4711  * only once the process has exited, or <b>count</b> bytes are read. Returns
4712  * the number of bytes read, or -1 on error. */
4713 ssize_t
4714 tor_read_all_handle(HANDLE h, char *buf, size_t count,
4715                     const process_handle_t *process)
4716 {
4717   size_t numread = 0;
4718   BOOL retval;
4719   DWORD byte_count;
4720   BOOL process_exited = FALSE;
4721
4722   if (count > SIZE_T_CEILING || count > SSIZE_MAX)
4723     return -1;
4724
4725   while (numread != count) {
4726     /* Check if there is anything to read */
4727     retval = PeekNamedPipe(h, NULL, 0, NULL, &byte_count, NULL);
4728     if (!retval) {
4729       log_warn(LD_GENERAL,
4730         "Failed to peek from handle: %s",
4731         format_win32_error(GetLastError()));
4732       return -1;
4733     } else if (0 == byte_count) {
4734       /* Nothing available: process exited or it is busy */
4735
4736       /* Exit if we don't know whether the process is running */
4737       if (NULL == process)
4738         break;
4739
4740       /* The process exited and there's nothing left to read from it */
4741       if (process_exited)
4742         break;
4743
4744       /* If process is not running, check for output one more time in case
4745          it wrote something after the peek was performed. Otherwise keep on
4746          waiting for output */
4747       tor_assert(process != NULL);
4748       byte_count = WaitForSingleObject(process->pid.hProcess, 0);
4749       if (WAIT_TIMEOUT != byte_count)
4750         process_exited = TRUE;
4751
4752       continue;
4753     }
4754
4755     /* There is data to read; read it */
4756     retval = ReadFile(h, buf+numread, count-numread, &byte_count, NULL);
4757     tor_assert(byte_count + numread <= count);
4758     if (!retval) {
4759       log_warn(LD_GENERAL, "Failed to read from handle: %s",
4760         format_win32_error(GetLastError()));
4761       return -1;
4762     } else if (0 == byte_count) {
4763       /* End of file */
4764       break;
4765     }
4766     numread += byte_count;
4767   }
4768   return (ssize_t)numread;
4769 }
4770 #else
4771 /** Read from a handle <b>h</b> into <b>buf</b>, up to <b>count</b> bytes.  If
4772  * <b>process</b> is NULL, the function will return immediately if there is
4773  * nothing more to read. Otherwise data will be read until end of file, or
4774  * <b>count</b> bytes are read.  Returns the number of bytes read, or -1 on
4775  * error. Sets <b>eof</b> to true if <b>eof</b> is not NULL and the end of the
4776  * file has been reached. */
4777 ssize_t
4778 tor_read_all_handle(FILE *h, char *buf, size_t count,
4779                     const process_handle_t *process,
4780                     int *eof)
4781 {
4782   size_t numread = 0;
4783   char *retval;
4784
4785   if (eof)
4786     *eof = 0;
4787
4788   if (count > SIZE_T_CEILING || count > SSIZE_MAX)
4789     return -1;
4790
4791   while (numread != count) {
4792     /* Use fgets because that is what we use in log_from_pipe() */
4793     retval = fgets(buf+numread, (int)(count-numread), h);
4794     if (NULL == retval) {
4795       if (feof(h)) {
4796         log_debug(LD_GENERAL, "fgets() reached end of file");
4797         if (eof)
4798           *eof = 1;
4799         break;
4800       } else {
4801         if (EAGAIN == errno) {
4802           if (process)
4803             continue;
4804           else
4805             break;
4806         } else {
4807           log_warn(LD_GENERAL, "fgets() from handle failed: %s",
4808                    strerror(errno));
4809           return -1;
4810         }
4811       }
4812     }
4813     tor_assert(retval != NULL);
4814     tor_assert(strlen(retval) + numread <= count);
4815     numread += strlen(retval);
4816   }
4817
4818   log_debug(LD_GENERAL, "fgets() read %d bytes from handle", (int)numread);
4819   return (ssize_t)numread;
4820 }
4821 #endif
4822
4823 /** Read from stdout of a process until the process exits. */
4824 ssize_t
4825 tor_read_all_from_process_stdout(const process_handle_t *process_handle,
4826                                  char *buf, size_t count)
4827 {
4828 #ifdef _WIN32
4829   return tor_read_all_handle(process_handle->stdout_pipe, buf, count,
4830                              process_handle);
4831 #else
4832   return tor_read_all_handle(process_handle->stdout_handle, buf, count,
4833                              process_handle, NULL);
4834 #endif
4835 }
4836
4837 /** Read from stdout of a process until the process exits. */
4838 ssize_t
4839 tor_read_all_from_process_stderr(const process_handle_t *process_handle,
4840                                  char *buf, size_t count)
4841 {
4842 #ifdef _WIN32
4843   return tor_read_all_handle(process_handle->stderr_pipe, buf, count,
4844                              process_handle);
4845 #else
4846   return tor_read_all_handle(process_handle->stderr_handle, buf, count,
4847                              process_handle, NULL);
4848 #endif
4849 }
4850
4851 /** Split buf into lines, and add to smartlist. The buffer <b>buf</b> will be
4852  * modified. The resulting smartlist will consist of pointers to buf, so there
4853  * is no need to free the contents of sl. <b>buf</b> must be a NUL-terminated
4854  * string. <b>len</b> should be set to the length of the buffer excluding the
4855  * NUL. Non-printable characters (including NUL) will be replaced with "." */
4856 int
4857 tor_split_lines(smartlist_t *sl, char *buf, int len)
4858 {
4859   /* Index in buf of the start of the current line */
4860   int start = 0;
4861   /* Index in buf of the current character being processed */
4862   int cur = 0;
4863   /* Are we currently in a line */
4864   char in_line = 0;
4865
4866   /* Loop over string */
4867   while (cur < len) {
4868     /* Loop until end of line or end of string */
4869     for (; cur < len; cur++) {
4870       if (in_line) {
4871         if ('\r' == buf[cur] || '\n' == buf[cur]) {
4872           /* End of line */
4873           buf[cur] = '\0';
4874           /* Point cur to the next line */
4875           cur++;
4876           /* Line starts at start and ends with a nul */
4877           break;
4878         } else {
4879           if (!TOR_ISPRINT(buf[cur]))
4880             buf[cur] = '.';
4881         }
4882       } else {
4883         if ('\r' == buf[cur] || '\n' == buf[cur]) {
4884           /* Skip leading vertical space */
4885           ;
4886         } else {
4887           in_line = 1;
4888           start = cur;
4889           if (!TOR_ISPRINT(buf[cur]))
4890             buf[cur] = '.';
4891         }
4892       }
4893     }
4894     /* We are at the end of the line or end of string. If in_line is true there
4895      * is a line which starts at buf+start and ends at a NUL. cur points to
4896      * the character after the NUL. */
4897     if (in_line)
4898       smartlist_add(sl, (void *)(buf+start));
4899     in_line = 0;
4900   }
4901   return smartlist_len(sl);
4902 }
4903
4904 /** Return a string corresponding to <b>stream_status</b>. */
4905 const char *
4906 stream_status_to_string(enum stream_status stream_status)
4907 {
4908   switch (stream_status) {
4909     case IO_STREAM_OKAY:
4910       return "okay";
4911     case IO_STREAM_EAGAIN:
4912       return "temporarily unavailable";
4913     case IO_STREAM_TERM:
4914       return "terminated";
4915     case IO_STREAM_CLOSED:
4916       return "closed";
4917     default:
4918       tor_fragile_assert();
4919       return "unknown";
4920   }
4921 }
4922
4923 /* DOCDOC */
4924 static void
4925 log_portfw_spawn_error_message(const char *buf,
4926                                const char *executable, int *child_status)
4927 {
4928   /* Parse error message */
4929   int retval, child_state, saved_errno;
4930   retval = tor_sscanf(buf, SPAWN_ERROR_MESSAGE "%x/%x",
4931                       &child_state, &saved_errno);
4932   if (retval == 2) {
4933     log_warn(LD_GENERAL,
4934              "Failed to start child process \"%s\" in state %d: %s",
4935              executable, child_state, strerror(saved_errno));
4936     if (child_status)
4937       *child_status = 1;
4938   } else {
4939     /* Failed to parse message from child process, log it as a
4940        warning */
4941     log_warn(LD_GENERAL,
4942              "Unexpected message from port forwarding helper \"%s\": %s",
4943              executable, buf);
4944   }
4945 }
4946
4947 #ifdef _WIN32
4948
4949 /** Return a smartlist containing lines outputted from
4950  *  <b>handle</b>. Return NULL on error, and set
4951  *  <b>stream_status_out</b> appropriately. */
4952 MOCK_IMPL(smartlist_t *,
4953 tor_get_lines_from_handle, (HANDLE *handle,
4954                             enum stream_status *stream_status_out))
4955 {
4956   int pos;
4957   char stdout_buf[600] = {0};
4958   smartlist_t *lines = NULL;
4959
4960   tor_assert(stream_status_out);
4961
4962   *stream_status_out = IO_STREAM_TERM;
4963
4964   pos = tor_read_all_handle(handle, stdout_buf, sizeof(stdout_buf) - 1, NULL);
4965   if (pos < 0) {
4966     *stream_status_out = IO_STREAM_TERM;
4967     return NULL;
4968   }
4969   if (pos == 0) {
4970     *stream_status_out = IO_STREAM_EAGAIN;
4971     return NULL;
4972   }
4973
4974   /* End with a null even if there isn't a \r\n at the end */
4975   /* TODO: What if this is a partial line? */
4976   stdout_buf[pos] = '\0';
4977
4978   /* Split up the buffer */
4979   lines = smartlist_new();
4980   tor_split_lines(lines, stdout_buf, pos);
4981
4982   /* Currently 'lines' is populated with strings residing on the
4983      stack. Replace them with their exact copies on the heap: */
4984   SMARTLIST_FOREACH(lines, char *, line,
4985                     SMARTLIST_REPLACE_CURRENT(lines, line, tor_strdup(line)));
4986
4987   *stream_status_out = IO_STREAM_OKAY;
4988
4989   return lines;
4990 }
4991
4992 /** Read from stream, and send lines to log at the specified log level.
4993  * Returns -1 if there is a error reading, and 0 otherwise.
4994  * If the generated stream is flushed more often than on new lines, or
4995  * a read exceeds 256 bytes, lines will be truncated. This should be fixed,
4996  * along with the corresponding problem on *nix (see bug #2045).
4997  */
4998 static int
4999 log_from_handle(HANDLE *pipe, int severity)
5000 {
5001   char buf[256];
5002   int pos;
5003   smartlist_t *lines;
5004
5005   pos = tor_read_all_handle(pipe, buf, sizeof(buf) - 1, NULL);
5006   if (pos < 0) {
5007     /* Error */
5008     log_warn(LD_GENERAL, "Failed to read data from subprocess");
5009     return -1;
5010   }
5011
5012   if (0 == pos) {
5013     /* There's nothing to read (process is busy or has exited) */
5014     log_debug(LD_GENERAL, "Subprocess had nothing to say");
5015     return 0;
5016   }
5017
5018   /* End with a null even if there isn't a \r\n at the end */
5019   /* TODO: What if this is a partial line? */
5020   buf[pos] = '\0';
5021   log_debug(LD_GENERAL, "Subprocess had %d bytes to say", pos);
5022
5023   /* Split up the buffer */
5024   lines = smartlist_new();
5025   tor_split_lines(lines, buf, pos);
5026
5027   /* Log each line */
5028   SMARTLIST_FOREACH(lines, char *, line,
5029   {
5030     log_fn(severity, LD_GENERAL, "Port forwarding helper says: %s", line);
5031   });
5032   smartlist_free(lines);
5033
5034   return 0;
5035 }
5036
5037 #else
5038
5039 /** Return a smartlist containing lines outputted from
5040  *  <b>handle</b>. Return NULL on error, and set
5041  *  <b>stream_status_out</b> appropriately. */
5042 MOCK_IMPL(smartlist_t *,
5043 tor_get_lines_from_handle, (FILE *handle,
5044                             enum stream_status *stream_status_out))
5045 {
5046   enum stream_status stream_status;
5047   char stdout_buf[400];
5048   smartlist_t *lines = NULL;
5049
5050   while (1) {
5051     memset(stdout_buf, 0, sizeof(stdout_buf));
5052
5053     stream_status = get_string_from_pipe(handle,
5054                                          stdout_buf, sizeof(stdout_buf) - 1);
5055     if (stream_status != IO_STREAM_OKAY)
5056       goto done;
5057
5058     if (!lines) lines = smartlist_new();
5059     smartlist_add(lines, tor_strdup(stdout_buf));
5060   }
5061
5062  done:
5063   *stream_status_out = stream_status;
5064   return lines;
5065 }
5066
5067 /** Read from stream, and send lines to log at the specified log level.
5068  * Returns 1 if stream is closed normally, -1 if there is a error reading, and
5069  * 0 otherwise. Handles lines from tor-fw-helper and
5070  * tor_spawn_background() specially.
5071  */
5072 static int
5073 log_from_pipe(FILE *stream, int severity, const char *executable,
5074               int *child_status)
5075 {
5076   char buf[256];
5077   enum stream_status r;
5078
5079   for (;;) {
5080     r = get_string_from_pipe(stream, buf, sizeof(buf) - 1);
5081
5082     if (r == IO_STREAM_CLOSED) {
5083       return 1;
5084     } else if (r == IO_STREAM_EAGAIN) {
5085       return 0;
5086     } else if (r == IO_STREAM_TERM) {
5087       return -1;
5088     }
5089
5090     tor_assert(r == IO_STREAM_OKAY);
5091
5092     /* Check if buf starts with SPAWN_ERROR_MESSAGE */
5093     if (strcmpstart(buf, SPAWN_ERROR_MESSAGE) == 0) {
5094       log_portfw_spawn_error_message(buf, executable, child_status);
5095     } else {
5096       log_fn(severity, LD_GENERAL, "Port forwarding helper says: %s", buf);
5097     }
5098   }
5099
5100   /* We should never get here */
5101   return -1;
5102 }
5103 #endif
5104
5105 /** Reads from <b>stream</b> and stores input in <b>buf_out</b> making
5106  *  sure it's below <b>count</b> bytes.
5107  *  If the string has a trailing newline, we strip it off.
5108  *
5109  * This function is specifically created to handle input from managed
5110  * proxies, according to the pluggable transports spec. Make sure it
5111  * fits your needs before using it.
5112  *
5113  * Returns:
5114  * IO_STREAM_CLOSED: If the stream is closed.
5115  * IO_STREAM_EAGAIN: If there is nothing to read and we should check back
5116  *  later.
5117  * IO_STREAM_TERM: If something is wrong with the stream.
5118  * IO_STREAM_OKAY: If everything went okay and we got a string
5119  *  in <b>buf_out</b>. */
5120 enum stream_status
5121 get_string_from_pipe(FILE *stream, char *buf_out, size_t count)
5122 {
5123   char *retval;
5124   size_t len;
5125
5126   tor_assert(count <= INT_MAX);
5127
5128   retval = fgets(buf_out, (int)count, stream);
5129
5130   if (!retval) {
5131     if (feof(stream)) {
5132       /* Program has closed stream (probably it exited) */
5133       /* TODO: check error */
5134       return IO_STREAM_CLOSED;
5135     } else {
5136       if (EAGAIN == errno) {
5137         /* Nothing more to read, try again next time */
5138         return IO_STREAM_EAGAIN;
5139       } else {
5140         /* There was a problem, abandon this child process */
5141         return IO_STREAM_TERM;
5142       }
5143     }
5144   } else {
5145     len = strlen(buf_out);
5146     if (len == 0) {
5147       /* this probably means we got a NUL at the start of the string. */
5148       return IO_STREAM_EAGAIN;
5149     }
5150
5151     if (buf_out[len - 1] == '\n') {
5152       /* Remove the trailing newline */
5153       buf_out[len - 1] = '\0';
5154     } else {
5155       /* No newline; check whether we overflowed the buffer */
5156       if (!feof(stream))
5157         log_info(LD_GENERAL,
5158                  "Line from stream was truncated: %s", buf_out);
5159       /* TODO: What to do with this error? */
5160     }
5161
5162     return IO_STREAM_OKAY;
5163   }
5164
5165   /* We should never get here */
5166   return IO_STREAM_TERM;
5167 }
5168
5169 /** Parse a <b>line</b> from tor-fw-helper and issue an appropriate
5170  *  log message to our user. */
5171 static void
5172 handle_fw_helper_line(const char *executable, const char *line)
5173 {
5174   smartlist_t *tokens = smartlist_new();
5175   char *message = NULL;
5176   char *message_for_log = NULL;
5177   const char *external_port = NULL;
5178   const char *internal_port = NULL;
5179   const char *result = NULL;
5180   int port = 0;
5181   int success = 0;
5182
5183   if (strcmpstart(line, SPAWN_ERROR_MESSAGE) == 0) {
5184     /* We need to check for SPAWN_ERROR_MESSAGE again here, since it's
5185      * possible that it got sent after we tried to read it in log_from_pipe.
5186      *
5187      * XXX Ideally, we should be using one of stdout/stderr for the real
5188      * output, and one for the output of the startup code.  We used to do that
5189      * before cd05f35d2c.
5190      */
5191     int child_status;
5192     log_portfw_spawn_error_message(line, executable, &child_status);
5193     goto done;
5194   }
5195
5196   smartlist_split_string(tokens, line, NULL,
5197                          SPLIT_SKIP_SPACE|SPLIT_IGNORE_BLANK, -1);
5198
5199   if (smartlist_len(tokens) < 5)
5200     goto err;
5201
5202   if (strcmp(smartlist_get(tokens, 0), "tor-fw-helper") ||
5203       strcmp(smartlist_get(tokens, 1), "tcp-forward"))
5204     goto err;
5205
5206   external_port = smartlist_get(tokens, 2);
5207   internal_port = smartlist_get(tokens, 3);
5208   result = smartlist_get(tokens, 4);
5209
5210   if (smartlist_len(tokens) > 5) {
5211     /* If there are more than 5 tokens, they are part of [<message>].
5212        Let's use a second smartlist to form the whole message;
5213        strncat loops suck. */
5214     int i;
5215     int message_words_n = smartlist_len(tokens) - 5;
5216     smartlist_t *message_sl = smartlist_new();
5217     for (i = 0; i < message_words_n; i++)
5218       smartlist_add(message_sl, smartlist_get(tokens, 5+i));
5219
5220     tor_assert(smartlist_len(message_sl) > 0);
5221     message = smartlist_join_strings(message_sl, " ", 0, NULL);
5222
5223     /* wrap the message in log-friendly wrapping */
5224     tor_asprintf(&message_for_log, " ('%s')", message);
5225
5226     smartlist_free(message_sl);
5227   }
5228
5229   port = atoi(external_port);
5230   if (port < 1 || port > 65535)
5231     goto err;
5232
5233   port = atoi(internal_port);
5234   if (port < 1 || port > 65535)
5235     goto err;
5236
5237   if (!strcmp(result, "SUCCESS"))
5238     success = 1;
5239   else if (!strcmp(result, "FAIL"))
5240     success = 0;
5241   else
5242     goto err;
5243
5244   if (!success) {
5245     log_warn(LD_GENERAL, "Tor was unable to forward TCP port '%s' to '%s'%s. "
5246              "Please make sure that your router supports port "
5247              "forwarding protocols (like NAT-PMP). Note that if '%s' is "
5248              "your ORPort, your relay will be unable to receive inbound "
5249              "traffic.", external_port, internal_port,
5250              message_for_log ? message_for_log : "",
5251              internal_port);
5252   } else {
5253     log_info(LD_GENERAL,
5254              "Tor successfully forwarded TCP port '%s' to '%s'%s.",
5255              external_port, internal_port,
5256              message_for_log ? message_for_log : "");
5257   }
5258
5259   goto done;
5260
5261  err:
5262   log_warn(LD_GENERAL, "tor-fw-helper sent us a string we could not "
5263            "parse (%s).", line);
5264
5265  done:
5266   SMARTLIST_FOREACH(tokens, char *, cp, tor_free(cp));
5267   smartlist_free(tokens);
5268   tor_free(message);
5269   tor_free(message_for_log);
5270 }
5271
5272 /** Read what tor-fw-helper has to say in its stdout and handle it
5273  *  appropriately */
5274 static int
5275 handle_fw_helper_output(const char *executable,
5276                         process_handle_t *process_handle)
5277 {
5278   smartlist_t *fw_helper_output = NULL;
5279   enum stream_status stream_status = 0;
5280
5281   fw_helper_output =
5282     tor_get_lines_from_handle(tor_process_get_stdout_pipe(process_handle),
5283                               &stream_status);
5284   if (!fw_helper_output) { /* didn't get any output from tor-fw-helper */
5285     /* if EAGAIN we should retry in the future */
5286     return (stream_status == IO_STREAM_EAGAIN) ? 0 : -1;
5287   }
5288
5289   /* Handle the lines we got: */
5290   SMARTLIST_FOREACH_BEGIN(fw_helper_output, char *, line) {
5291     handle_fw_helper_line(executable, line);
5292     tor_free(line);
5293   } SMARTLIST_FOREACH_END(line);
5294
5295   smartlist_free(fw_helper_output);
5296
5297   return 0;
5298 }
5299
5300 /** Spawn tor-fw-helper and ask it to forward the ports in
5301  *  <b>ports_to_forward</b>. <b>ports_to_forward</b> contains strings
5302  *  of the form "<external port>:<internal port>", which is the format
5303  *  that tor-fw-helper expects. */
5304 void
5305 tor_check_port_forwarding(const char *filename,
5306                           smartlist_t *ports_to_forward,
5307                           time_t now)
5308 {
5309 /* When fw-helper succeeds, how long do we wait until running it again */
5310 #define TIME_TO_EXEC_FWHELPER_SUCCESS 300
5311 /* When fw-helper failed to start, how long do we wait until running it again
5312  */
5313 #define TIME_TO_EXEC_FWHELPER_FAIL 60
5314
5315   /* Static variables are initialized to zero, so child_handle.status=0
5316    * which corresponds to it not running on startup */
5317   static process_handle_t *child_handle=NULL;
5318
5319   static time_t time_to_run_helper = 0;
5320   int stderr_status, retval;
5321   int stdout_status = 0;
5322
5323   tor_assert(filename);
5324
5325   /* Start the child, if it is not already running */
5326   if ((!child_handle || child_handle->status != PROCESS_STATUS_RUNNING) &&
5327       time_to_run_helper < now) {
5328     /*tor-fw-helper cli looks like this: tor_fw_helper -p :5555 -p 4555:1111 */
5329     const char **argv; /* cli arguments */
5330     int args_n, status;
5331     int argv_index = 0; /* index inside 'argv' */
5332
5333     tor_assert(smartlist_len(ports_to_forward) > 0);
5334
5335     /* check for overflow during 'argv' allocation:
5336        (len(ports_to_forward)*2 + 2)*sizeof(char*) > SIZE_MAX ==
5337        len(ports_to_forward) > (((SIZE_MAX/sizeof(char*)) - 2)/2) */
5338     if ((size_t) smartlist_len(ports_to_forward) >
5339         (((SIZE_MAX/sizeof(char*)) - 2)/2)) {
5340       log_warn(LD_GENERAL,
5341                "Overflow during argv allocation. This shouldn't happen.");
5342       return;
5343     }
5344     /* check for overflow during 'argv_index' increase:
5345        ((len(ports_to_forward)*2 + 2) > INT_MAX) ==
5346        len(ports_to_forward) > (INT_MAX - 2)/2 */
5347     if (smartlist_len(ports_to_forward) > (INT_MAX - 2)/2) {
5348       log_warn(LD_GENERAL,
5349                "Overflow during argv_index increase. This shouldn't happen.");
5350       return;
5351     }
5352
5353     /* Calculate number of cli arguments: one for the filename, two
5354        for each smartlist element (one for "-p" and one for the
5355        ports), and one for the final NULL. */
5356     args_n = 1 + 2*smartlist_len(ports_to_forward) + 1;
5357     argv = tor_calloc(args_n, sizeof(char *));
5358
5359     argv[argv_index++] = filename;
5360     SMARTLIST_FOREACH_BEGIN(ports_to_forward, const char *, port) {
5361       argv[argv_index++] = "-p";
5362       argv[argv_index++] = port;
5363     } SMARTLIST_FOREACH_END(port);
5364     argv[argv_index] = NULL;
5365
5366     /* Assume tor-fw-helper will succeed, start it later*/
5367     time_to_run_helper = now + TIME_TO_EXEC_FWHELPER_SUCCESS;
5368
5369     if (child_handle) {
5370       tor_process_handle_destroy(child_handle, 1);
5371       child_handle = NULL;
5372     }
5373
5374 #ifdef _WIN32
5375     /* Passing NULL as lpApplicationName makes Windows search for the .exe */
5376     status = tor_spawn_background(NULL, argv, NULL, &child_handle);
5377 #else
5378     status = tor_spawn_background(filename, argv, NULL, &child_handle);
5379 #endif
5380
5381     tor_free_((void*)argv);
5382     argv=NULL;
5383
5384     if (PROCESS_STATUS_ERROR == status) {
5385       log_warn(LD_GENERAL, "Failed to start port forwarding helper %s",
5386               filename);
5387       time_to_run_helper = now + TIME_TO_EXEC_FWHELPER_FAIL;
5388       return;
5389     }
5390
5391     log_info(LD_GENERAL,
5392              "Started port forwarding helper (%s) with pid '%d'",
5393              filename, tor_process_get_pid(child_handle));
5394   }
5395
5396   /* If child is running, read from its stdout and stderr) */
5397   if (child_handle && PROCESS_STATUS_RUNNING == child_handle->status) {
5398     /* Read from stdout/stderr and log result */
5399     retval = 0;
5400 #ifdef _WIN32
5401     stderr_status = log_from_handle(child_handle->stderr_pipe, LOG_INFO);
5402 #else
5403     stderr_status = log_from_pipe(child_handle->stderr_handle,
5404                                   LOG_INFO, filename, &retval);
5405 #endif
5406     if (handle_fw_helper_output(filename, child_handle) < 0) {
5407       log_warn(LD_GENERAL, "Failed to handle fw helper output.");
5408       stdout_status = -1;
5409       retval = -1;
5410     }
5411
5412     if (retval) {
5413       /* There was a problem in the child process */
5414       time_to_run_helper = now + TIME_TO_EXEC_FWHELPER_FAIL;
5415     }
5416
5417     /* Combine the two statuses in order of severity */
5418     if (-1 == stdout_status || -1 == stderr_status)
5419       /* There was a failure */
5420       retval = -1;
5421 #ifdef _WIN32
5422     else if (!child_handle || tor_get_exit_code(child_handle, 0, NULL) !=
5423              PROCESS_EXIT_RUNNING) {
5424       /* process has exited or there was an error */
5425       /* TODO: Do something with the process return value */
5426       /* TODO: What if the process output something since
5427        * between log_from_handle and tor_get_exit_code? */
5428       retval = 1;
5429     }
5430 #else
5431     else if (1 == stdout_status || 1 == stderr_status)
5432       /* stdout or stderr was closed, the process probably
5433        * exited. It will be reaped by waitpid() in main.c */
5434       /* TODO: Do something with the process return value */
5435       retval = 1;
5436 #endif
5437     else
5438       /* Both are fine */
5439       retval = 0;
5440
5441     /* If either pipe indicates a failure, act on it */
5442     if (0 != retval) {
5443       if (1 == retval) {
5444         log_info(LD_GENERAL, "Port forwarding helper terminated");
5445         child_handle->status = PROCESS_STATUS_NOTRUNNING;
5446       } else {
5447         log_warn(LD_GENERAL, "Failed to read from port forwarding helper");
5448         child_handle->status = PROCESS_STATUS_ERROR;
5449       }
5450
5451       /* TODO: The child might not actually be finished (maybe it failed or
5452          closed stdout/stderr), so maybe we shouldn't start another? */
5453     }
5454   }
5455 }
5456
5457 /** Initialize the insecure RNG <b>rng</b> from a seed value <b>seed</b>. */
5458 void
5459 tor_init_weak_random(tor_weak_rng_t *rng, unsigned seed)
5460 {
5461   rng->state = (uint32_t)(seed & 0x7fffffff);
5462 }
5463
5464 /** Return a randomly chosen value in the range 0..TOR_WEAK_RANDOM_MAX based
5465  * on the RNG state of <b>rng</b>.  This entropy will not be cryptographically
5466  * strong; do not rely on it for anything an adversary should not be able to
5467  * predict. */
5468 int32_t
5469 tor_weak_random(tor_weak_rng_t *rng)
5470 {
5471   /* Here's a linear congruential generator. OpenBSD and glibc use these
5472    * parameters; they aren't too bad, and should have maximal period over the
5473    * range 0..INT32_MAX. We don't want to use the platform rand() or random(),
5474    * since some platforms have bad weak RNGs that only return values in the
5475    * range 0..INT16_MAX, which just isn't enough. */
5476   rng->state = (rng->state * 1103515245 + 12345) & 0x7fffffff;
5477   return (int32_t) rng->state;
5478 }
5479
5480 /** Return a random number in the range [0 , <b>top</b>). {That is, the range
5481  * of integers i such that 0 <= i < top.}  Chooses uniformly.  Requires that
5482  * top is greater than 0. This randomness is not cryptographically strong; do
5483  * not rely on it for anything an adversary should not be able to predict. */
5484 int32_t
5485 tor_weak_random_range(tor_weak_rng_t *rng, int32_t top)
5486 {
5487   /* We don't want to just do tor_weak_random() % top, since random() is often
5488    * implemented with an LCG whose modulus is a power of 2, and those are
5489    * cyclic in their low-order bits. */
5490   int divisor, result;
5491   tor_assert(top > 0);
5492   divisor = TOR_WEAK_RANDOM_MAX / top;
5493   do {
5494     result = (int32_t)(tor_weak_random(rng) / divisor);
5495   } while (result >= top);
5496   return result;
5497 }
5498
5499 /** Cast a given double value to a int64_t. Return 0 if number is NaN.
5500  * Returns either INT64_MIN or INT64_MAX if number is outside of the int64_t
5501  * range. */
5502 int64_t cast_double_to_int64(double number)
5503 {
5504   int exp;
5505
5506   /* NaN is a special case that can't be used with the logic below. */
5507   if (isnan(number)) {
5508     return 0;
5509   }
5510
5511   /* Time to validate if result can overflows a int64_t value. Fun with
5512    * float! Find that exponent exp such that
5513    *    number == x * 2^exp
5514    * for some x with abs(x) in [0.5, 1.0). Note that this implies that the
5515    * magnitude of number is strictly less than 2^exp.
5516    *
5517    * If number is infinite, the call to frexp is legal but the contents of
5518    * exp are unspecified. */
5519   frexp(number, &exp);
5520
5521   /* If the magnitude of number is strictly less than 2^63, the truncated
5522    * version of number is guaranteed to be representable. The only
5523    * representable integer for which this is not the case is INT64_MIN, but
5524    * it is covered by the logic below. */
5525   if (isfinite(number) && exp <= 63) {
5526     return number;
5527   }
5528
5529   /* Handle infinities and finite numbers with magnitude >= 2^63. */
5530   return signbit(number) ? INT64_MIN : INT64_MAX;
5531 }