src/or/buffers.c

   1 /* Copyright (c) 2001 Matej Pfajfar.
   2  * Copyright (c) 2001-2004, Roger Dingledine.
   3  * Copyright (c) 2004-2006, Roger Dingledine, Nick Mathewson.
   4  * Copyright (c) 2007-2013, The Tor Project, Inc. */
   5 /* See LICENSE for licensing information */
   6
   7 /**
   8  * \file buffers.c
   9  * \brief Implements a generic interface buffer.  Buffers are
  10  * fairly opaque string holders that can read to or flush from:
  11  * memory, file descriptors, or TLS connections.
  12  **/
  13 #define BUFFERS_PRIVATE
  14 #include "or.h"
  15 #include "addressmap.h"
  16 #include "buffers.h"
  17 #include "config.h"
  18 #include "connection_edge.h"
  19 #include "connection_or.h"
  20 #include "control.h"
  21 #include "reasons.h"
  22 #include "ext_orport.h"
  23 #include "../common/util.h"
  24 #include "../common/torlog.h"
  25 #ifdef HAVE_UNISTD_H
  26 #include <unistd.h>
  27 #endif
  28
  29 //#define PARANOIA
  30
  31 #ifdef PARANOIA
  32 /** Helper: If PARANOIA is defined, assert that the buffer in local variable
  33  * <b>buf</b> is well-formed. */
  34 #define check() STMT_BEGIN assert_buf_ok(buf); STMT_END
  35 #else
  36 #define check() STMT_NIL
  37 #endif
  38
  39 /* Implementation notes:
  40  *
  41  * After flirting with memmove, and dallying with ring-buffers, we're finally
  42  * getting up to speed with the 1970s and implementing buffers as a linked
  43  * list of small chunks.  Each buffer has such a list; data is removed from
  44  * the head of the list, and added at the tail.  The list is singly linked,
  45  * and the buffer keeps a pointer to the head and the tail.
  46  *
  47  * Every chunk, except the tail, contains at least one byte of data.  Data in
  48  * each chunk is contiguous.
  49  *
  50  * When you need to treat the first N characters on a buffer as a contiguous
  51  * string, use the buf_pullup function to make them so.  Don't do this more
  52  * than necessary.
  53  *
  54  * The major free Unix kernels have handled buffers like this since, like,
  55  * forever.
  56  */
  57
  58 static int parse_socks(const char *data, size_t datalen, socks_request_t *req,
  59                        int log_sockstype, int safe_socks, ssize_t *drain_out,
  60                        size_t *want_length_out);
  61 static int parse_socks_client(const uint8_t *data, size_t datalen,
  62                               int state, char **reason,
  63                               ssize_t *drain_out);
  64
  65 /* Chunk manipulation functions */
  66
/** Number of bytes in a chunk_t that come before its <b>mem</b> storage
 * area, i.e. the offset of mem[0] inside the structure. */
#define CHUNK_HEADER_LEN STRUCT_OFFSET(chunk_t, mem[0])

/** Return the number of bytes needed to allocate a chunk to hold
 * <b>memlen</b> bytes. */
#define CHUNK_ALLOC_SIZE(memlen) (CHUNK_HEADER_LEN + (memlen))
/** Return the number of usable bytes in a chunk allocated with
 * malloc(<b>memlen</b>). */
#define CHUNK_SIZE_WITH_ALLOC(memlen) ((memlen) - CHUNK_HEADER_LEN)
  75
  76 /** Return the next character in <b>chunk</b> onto which data can be appended.
  77  * If the chunk is full, this might be off the end of chunk->mem. */
  78 static INLINE char *
  79 CHUNK_WRITE_PTR(chunk_t *chunk)
  80 {
  81   return chunk->data + chunk->datalen;
  82 }
  83
  84 /** Return the number of bytes that can be written onto <b>chunk</b> without
  85  * running out of space. */
  86 static INLINE size_t
  87 CHUNK_REMAINING_CAPACITY(const chunk_t *chunk)
  88 {
  89   return (chunk->mem + chunk->memlen) - (chunk->data + chunk->datalen);
  90 }
  91
  92 /** Move all bytes stored in <b>chunk</b> to the front of <b>chunk</b>->mem,
  93  * to free up space at the end. */
  94 static INLINE void
  95 chunk_repack(chunk_t *chunk)
  96 {
  97   if (chunk->datalen && chunk->data != &chunk->mem[0]) {
  98     memmove(chunk->mem, chunk->data, chunk->datalen);
  99   }
 100   chunk->data = &chunk->mem[0];
 101 }
 102
 103 /** Keep track of total size of allocated chunks for consistency asserts */
 104 static size_t total_bytes_allocated_in_chunks = 0;
 105
 106 #if defined(ENABLE_BUF_FREELISTS) || defined(RUNNING_DOXYGEN)
/** A freelist of chunks: a singly linked stack of unused chunks that all
 * share one allocation size, plus usage counters. */
typedef struct chunk_freelist_t {
  size_t alloc_size; /**< What size chunks does this freelist hold? */
  int max_length; /**< Never allow more than this number of chunks in the
                   * freelist. */
  int slack; /**< When trimming the freelist, leave this number of extra
              * chunks beyond lowest_length.*/
  int cur_length; /**< How many chunks on the freelist now? */
  int lowest_length; /**< What's the smallest value of cur_length since the
                      * last time we cleaned this freelist? */
  uint64_t n_alloc; /**< Number of times a chunk of this size had to be
                     * freshly allocated because the freelist was empty. */
  uint64_t n_free; /**< Number of chunks of this size that were released
                    * to the allocator instead of being kept here. */
  uint64_t n_hit; /**< Number of times a request for a chunk was served
                   * from this freelist. */
  chunk_t *head; /**< First chunk on the freelist. */
} chunk_freelist_t;
 122
/** Macro to help define freelists.  Expands to a chunk_freelist_t
 * initializer with alloc_size <b>a</b>, max_length <b>m</b> and slack
 * <b>s</b>; every length, counter and the head pointer start out zeroed. */
#define FL(a,m,s) { a, m, s, 0, 0, 0, 0, 0, NULL }

/** Static array of freelists, sorted by alloc_size, terminated by an entry
 * with alloc_size of 0. */
static chunk_freelist_t freelists[] = {
  FL(4096, 256, 8), FL(8192, 128, 4), FL(16384, 64, 4), FL(32768, 32, 2),
  FL(0, 0, 0)
};
#undef FL
/** How many times have we looked for a chunk of a size that no freelist
 * could help with? */
static uint64_t n_freelist_miss = 0;
 136
 137 static void assert_freelist_ok(chunk_freelist_t *fl);
 138
 139 /** Return the freelist to hold chunks of size <b>alloc</b>, or NULL if
 140  * no freelist exists for that size. */
 141 static INLINE chunk_freelist_t *
 142 get_freelist(size_t alloc)
 143 {
 144   int i;
 145   for (i=0; (freelists[i].alloc_size <= alloc &&
 146              freelists[i].alloc_size); ++i ) {
 147     if (freelists[i].alloc_size == alloc) {
 148       return &freelists[i];
 149     }
 150   }
 151   return NULL;
 152 }
 153
 154 /** Deallocate a chunk or put it on a freelist */
 155 static void
 156 chunk_free_unchecked(chunk_t *chunk)
 157 {
 158   size_t alloc;
 159   chunk_freelist_t *freelist;
 160
 161   alloc = CHUNK_ALLOC_SIZE(chunk->memlen);
 162   freelist = get_freelist(alloc);
 163   if (freelist && freelist->cur_length < freelist->max_length) {
 164     chunk->next = freelist->head;
 165     freelist->head = chunk;
 166     ++freelist->cur_length;
 167   } else {
 168     if (freelist)
 169       ++freelist->n_free;
 170 #ifdef DEBUG_CHUNK_ALLOC
 171     tor_assert(alloc  == chunk->DBG_alloc);
 172 #endif
 173     tor_assert(total_bytes_allocated_in_chunks >= alloc);
 174     total_bytes_allocated_in_chunks -= alloc;
 175     tor_free(chunk);
 176   }
 177 }
 178
 179 /** Allocate a new chunk with a given allocation size, or get one from the
 180  * freelist.  Note that a chunk with allocation size A can actually hold only
 181  * CHUNK_SIZE_WITH_ALLOC(A) bytes in its mem field. */
 182 static INLINE chunk_t *
 183 chunk_new_with_alloc_size(size_t alloc)
 184 {
 185   chunk_t *ch;
 186   chunk_freelist_t *freelist;
 187   tor_assert(alloc >= sizeof(chunk_t));
 188   freelist = get_freelist(alloc);
 189   if (freelist && freelist->head) {
 190     ch = freelist->head;
 191     freelist->head = ch->next;
 192     if (--freelist->cur_length < freelist->lowest_length)
 193       freelist->lowest_length = freelist->cur_length;
 194     ++freelist->n_hit;
 195   } else {
 196     if (freelist)
 197       ++freelist->n_alloc;
 198     else
 199       ++n_freelist_miss;
 200     ch = tor_malloc(alloc);
 201 #ifdef DEBUG_CHUNK_ALLOC
 202     ch->DBG_alloc = alloc;
 203 #endif
 204     total_bytes_allocated_in_chunks += alloc;
 205   }
 206   ch->next = NULL;
 207   ch->datalen = 0;
 208   ch->memlen = CHUNK_SIZE_WITH_ALLOC(alloc);
 209   ch->data = &ch->mem[0];
 210   return ch;
 211 }
 212 #else
 213 static void
 214 chunk_free_unchecked(chunk_t *chunk)
 215 {
 216   if (!chunk)
 217     return;
 218 #ifdef DEBUG_CHUNK_ALLOC
 219   tor_assert(CHUNK_ALLOC_SIZE(chunk->memlen) == chunk->DBG_alloc);
 220 #endif
 221   tor_assert(total_bytes_allocated_in_chunks >=
 222              CHUNK_ALLOC_SIZE(chunk->memlen));
 223   total_bytes_allocated_in_chunks -= CHUNK_ALLOC_SIZE(chunk->memlen);
 224   tor_free(chunk);
 225 }
 226 static INLINE chunk_t *
 227 chunk_new_with_alloc_size(size_t alloc)
 228 {
 229   chunk_t *ch;
 230   ch = tor_malloc(alloc);
 231   ch->next = NULL;
 232   ch->datalen = 0;
 233 #ifdef DEBUG_CHUNK_ALLOC
 234   ch->DBG_alloc = alloc;
 235 #endif
 236   ch->memlen = CHUNK_SIZE_WITH_ALLOC(alloc);
 237   total_bytes_allocated_in_chunks += alloc;
 238   ch->data = &ch->mem[0];
 239   return ch;
 240 }
 241 #endif
 242
 243 /** Expand <b>chunk</b> until it can hold <b>sz</b> bytes, and return a
 244  * new pointer to <b>chunk</b>.  Old pointers are no longer valid. */
 245 static INLINE chunk_t *
 246 chunk_grow(chunk_t *chunk, size_t sz)
 247 {
 248   off_t offset;
 249   size_t memlen_orig = chunk->memlen;
 250   tor_assert(sz > chunk->memlen);
 251   offset = chunk->data - chunk->mem;
 252   chunk = tor_realloc(chunk, CHUNK_ALLOC_SIZE(sz));
 253   chunk->memlen = sz;
 254   chunk->data = chunk->mem + offset;
 255 #ifdef DEBUG_CHUNK_ALLOC
 256   tor_assert(chunk->DBG_alloc == CHUNK_ALLOC_SIZE(memlen_orig));
 257   chunk->DBG_alloc = CHUNK_ALLOC_SIZE(sz);
 258 #endif
 259   total_bytes_allocated_in_chunks +=
 260     CHUNK_ALLOC_SIZE(sz) - CHUNK_ALLOC_SIZE(memlen_orig);
 261   return chunk;
 262 }
 263
 264 /** If a read onto the end of a chunk would be smaller than this number, then
 265  * just start a new chunk. */
 266 #define MIN_READ_LEN 8
 267 /** Every chunk should take up at least this many bytes. */
 268 #define MIN_CHUNK_ALLOC 256
 269 /** No chunk should take up more than this many bytes. */
 270 #define MAX_CHUNK_ALLOC 65536
 271
 272 /** Return the allocation size we'd like to use to hold <b>target</b>
 273  * bytes. */
 274 static INLINE size_t
 275 preferred_chunk_size(size_t target)
 276 {
 277   size_t sz = MIN_CHUNK_ALLOC;
 278   while (CHUNK_SIZE_WITH_ALLOC(sz) < target) {
 279     sz <<= 1;
 280   }
 281   return sz;
 282 }
 283
 284 /** Remove from the freelists most chunks that have not been used since the
 285  * last call to buf_shrink_freelists().   Return the amount of memory
 286  * freed. */
 287 size_t
 288 buf_shrink_freelists(int free_all)
 289 {
 290 #ifdef ENABLE_BUF_FREELISTS
 291   int i;
 292   size_t total_freed = 0;
 293   disable_control_logging();
 294   for (i = 0; freelists[i].alloc_size; ++i) {
 295     int slack = freelists[i].slack;
 296     assert_freelist_ok(&freelists[i]);
 297     if (free_all || freelists[i].lowest_length > slack) {
 298       int n_to_free = free_all ? freelists[i].cur_length :
 299         (freelists[i].lowest_length - slack);
 300       int n_to_skip = freelists[i].cur_length - n_to_free;
 301       int orig_length = freelists[i].cur_length;
 302       int orig_n_to_free = n_to_free, n_freed=0;
 303       int orig_n_to_skip = n_to_skip;
 304       int new_length = n_to_skip;
 305       chunk_t **chp = &freelists[i].head;
 306       chunk_t *chunk;
 307       while (n_to_skip) {
 308         if (!(*chp) || ! (*chp)->next) {
 309           log_warn(LD_BUG, "I wanted to skip %d chunks in the freelist for "
 310                    "%d-byte chunks, but only found %d. (Length %d)",
 311                    orig_n_to_skip, (int)freelists[i].alloc_size,
 312                    orig_n_to_skip-n_to_skip, freelists[i].cur_length);
 313           assert_freelist_ok(&freelists[i]);
 314           goto done;
 315         }
 316         // tor_assert((*chp)->next);
 317         chp = &(*chp)->next;
 318         --n_to_skip;
 319       }
 320       chunk = *chp;
 321       *chp = NULL;
 322       while (chunk) {
 323         chunk_t *next = chunk->next;
 324 #ifdef DEBUG_CHUNK_ALLOC
 325         tor_assert(chunk->DBG_alloc == CHUNK_ALLOC_SIZE(chunk->memlen));
 326 #endif
 327         tor_assert(total_bytes_allocated_in_chunks >=
 328                    CHUNK_ALLOC_SIZE(chunk->memlen));
 329         total_bytes_allocated_in_chunks -= CHUNK_ALLOC_SIZE(chunk->memlen);
 330         total_freed += CHUNK_ALLOC_SIZE(chunk->memlen);
 331         tor_free(chunk);
 332         chunk = next;
 333         --n_to_free;
 334         ++n_freed;
 335         ++freelists[i].n_free;
 336       }
 337       if (n_to_free) {
 338         log_warn(LD_BUG, "Freelist length for %d-byte chunks may have been "
 339                  "messed up somehow.", (int)freelists[i].alloc_size);
 340         log_warn(LD_BUG, "There were %d chunks at the start.  I decided to "
 341                  "keep %d. I wanted to free %d.  I freed %d.  I somehow think "
 342                  "I have %d left to free.",
 343                  freelists[i].cur_length, n_to_skip, orig_n_to_free,
 344                  n_freed, n_to_free);
 345       }
 346       // tor_assert(!n_to_free);
 347       freelists[i].cur_length = new_length;
 348       tor_assert(orig_n_to_skip == new_length);
 349       log_info(LD_MM, "Cleaned freelist for %d-byte chunks: original "
 350                "length %d, kept %d, dropped %d. New length is %d",
 351                (int)freelists[i].alloc_size, orig_length,
 352                orig_n_to_skip, orig_n_to_free, new_length);
 353     }
 354     freelists[i].lowest_length = freelists[i].cur_length;
 355     assert_freelist_ok(&freelists[i]);
 356   }
 357  done:
 358   enable_control_logging();
 359   return total_freed;
 360 #else
 361   (void) free_all;
 362   return 0;
 363 #endif
 364 }
 365
 366 /** Describe the current status of the freelists at log level <b>severity</b>.
 367  */
 368 void
 369 buf_dump_freelist_sizes(int severity)
 370 {
 371 #ifdef ENABLE_BUF_FREELISTS
 372   int i;
 373   tor_log(severity, LD_MM, "====== Buffer freelists:");
 374   for (i = 0; freelists[i].alloc_size; ++i) {
 375     uint64_t total = ((uint64_t)freelists[i].cur_length) *
 376       freelists[i].alloc_size;
 377     tor_log(severity, LD_MM,
 378         U64_FORMAT" bytes in %d %d-byte chunks ["U64_FORMAT
 379         " misses; "U64_FORMAT" frees; "U64_FORMAT" hits]",
 380         U64_PRINTF_ARG(total),
 381         freelists[i].cur_length, (int)freelists[i].alloc_size,
 382         U64_PRINTF_ARG(freelists[i].n_alloc),
 383         U64_PRINTF_ARG(freelists[i].n_free),
 384         U64_PRINTF_ARG(freelists[i].n_hit));
 385   }
 386   tor_log(severity, LD_MM, U64_FORMAT" allocations in non-freelist sizes",
 387       U64_PRINTF_ARG(n_freelist_miss));
 388 #else
 389   (void)severity;
 390 #endif
 391 }
 392
 393 /** Collapse data from the first N chunks from <b>buf</b> into buf->head,
 394  * growing it as necessary, until buf->head has the first <b>bytes</b> bytes
 395  * of data from the buffer, or until buf->head has all the data in <b>buf</b>.
 396  *
 397  * If <b>nulterminate</b> is true, ensure that there is a 0 byte in
 398  * buf->head->mem right after all the data. */
 399 STATIC void
 400 buf_pullup(buf_t *buf, size_t bytes, int nulterminate)
 401 {
 402   /* XXXX nothing uses nulterminate; remove it. */
 403   chunk_t *dest, *src;
 404   size_t capacity;
 405   if (!buf->head)
 406     return;
 407
 408   check();
 409   if (buf->datalen < bytes)
 410     bytes = buf->datalen;
 411
 412   if (nulterminate) {
 413     capacity = bytes + 1;
 414     if (buf->head->datalen >= bytes && CHUNK_REMAINING_CAPACITY(buf->head)) {
 415       *CHUNK_WRITE_PTR(buf->head) = '\0';
 416       return;
 417     }
 418   } else {
 419     capacity = bytes;
 420     if (buf->head->datalen >= bytes)
 421       return;
 422   }
 423
 424   if (buf->head->memlen >= capacity) {
 425     /* We don't need to grow the first chunk, but we might need to repack it.*/
 426     size_t needed = capacity - buf->head->datalen;
 427     if (CHUNK_REMAINING_CAPACITY(buf->head) < needed)
 428       chunk_repack(buf->head);
 429     tor_assert(CHUNK_REMAINING_CAPACITY(buf->head) >= needed);
 430   } else {
 431     chunk_t *newhead;
 432     size_t newsize;
 433     /* We need to grow the chunk. */
 434     chunk_repack(buf->head);
 435     newsize = CHUNK_SIZE_WITH_ALLOC(preferred_chunk_size(capacity));
 436     newhead = chunk_grow(buf->head, newsize);
 437     tor_assert(newhead->memlen >= capacity);
 438     if (newhead != buf->head) {
 439       if (buf->tail == buf->head)
 440         buf->tail = newhead;
 441       buf->head = newhead;
 442     }
 443   }
 444
 445   dest = buf->head;
 446   while (dest->datalen < bytes) {
 447     size_t n = bytes - dest->datalen;
 448     src = dest->next;
 449     tor_assert(src);
 450     if (n > src->datalen) {
 451       memcpy(CHUNK_WRITE_PTR(dest), src->data, src->datalen);
 452       dest->datalen += src->datalen;
 453       dest->next = src->next;
 454       if (buf->tail == src)
 455         buf->tail = dest;
 456       chunk_free_unchecked(src);
 457     } else {
 458       memcpy(CHUNK_WRITE_PTR(dest), src->data, n);
 459       dest->datalen += n;
 460       src->data += n;
 461       src->datalen -= n;
 462       tor_assert(dest->datalen == bytes);
 463     }
 464   }
 465
 466   if (nulterminate) {
 467     tor_assert(CHUNK_REMAINING_CAPACITY(buf->head));
 468     *CHUNK_WRITE_PTR(buf->head) = '\0';
 469   }
 470
 471   check();
 472 }
 473
 474 #ifdef TOR_UNIT_TESTS
 475 void
 476 buf_get_first_chunk_data(const buf_t *buf, const char **cp, size_t *sz)
 477 {
 478   if (!buf || !buf->head) {
 479     *cp = NULL;
 480     *sz = 0;
 481   } else {
 482     *cp = buf->head->data;
 483     *sz = buf->head->datalen;
 484   }
 485 }
 486 #endif
 487
/** Resize buf so it won't hold extra memory that we haven't been
 * using lately.
 *
 * This implementation is currently a no-op: <b>buf</b> is ignored and
 * nothing is released.
 */
void
buf_shrink(buf_t *buf)
{
  (void)buf; /* Parameter intentionally unused. */
}
 496
 497 /** Remove the first <b>n</b> bytes from buf. */
 498 static INLINE void
 499 buf_remove_from_front(buf_t *buf, size_t n)
 500 {
 501   tor_assert(buf->datalen >= n);
 502   while (n) {
 503     tor_assert(buf->head);
 504     if (buf->head->datalen > n) {
 505       buf->head->datalen -= n;
 506       buf->head->data += n;
 507       buf->datalen -= n;
 508       return;
 509     } else {
 510       chunk_t *victim = buf->head;
 511       n -= victim->datalen;
 512       buf->datalen -= victim->datalen;
 513       buf->head = victim->next;
 514       if (buf->tail == victim)
 515         buf->tail = NULL;
 516       chunk_free_unchecked(victim);
 517     }
 518   }
 519   check();
 520 }
 521
 522 /** Create and return a new buf with default chunk capacity <b>size</b>.
 523  */
 524 buf_t *
 525 buf_new_with_capacity(size_t size)
 526 {
 527   buf_t *b = buf_new();
 528   b->default_chunk_size = preferred_chunk_size(size);
 529   return b;
 530 }
 531
 532 /** Allocate and return a new buffer with default capacity. */
 533 buf_t *
 534 buf_new(void)
 535 {
 536   buf_t *buf = tor_malloc_zero(sizeof(buf_t));
 537   buf->magic = BUFFER_MAGIC;
 538   buf->default_chunk_size = 4096;
 539   return buf;
 540 }
 541
 542 size_t
 543 buf_get_default_chunk_size(const buf_t *buf)
 544 {
 545   return buf->default_chunk_size;
 546 }
 547
 548 /** Remove all data from <b>buf</b>. */
 549 void
 550 buf_clear(buf_t *buf)
 551 {
 552   chunk_t *chunk, *next;
 553   buf->datalen = 0;
 554   for (chunk = buf->head; chunk; chunk = next) {
 555     next = chunk->next;
 556     chunk_free_unchecked(chunk);
 557   }
 558   buf->head = buf->tail = NULL;
 559 }
 560
 561 /** Return the number of bytes stored in <b>buf</b> */
 562 size_t
 563 buf_datalen(const buf_t *buf)
 564 {
 565   return buf->datalen;
 566 }
 567
 568 /** Return the total length of all chunks used in <b>buf</b>. */
 569 size_t
 570 buf_allocation(const buf_t *buf)
 571 {
 572   size_t total = 0;
 573   const chunk_t *chunk;
 574   for (chunk = buf->head; chunk; chunk = chunk->next) {
 575     total += CHUNK_ALLOC_SIZE(chunk->memlen);
 576   }
 577   return total;
 578 }
 579
 580 /** Return the number of bytes that can be added to <b>buf</b> without
 581  * performing any additional allocation. */
 582 size_t
 583 buf_slack(const buf_t *buf)
 584 {
 585   if (!buf->tail)
 586     return 0;
 587   else
 588     return CHUNK_REMAINING_CAPACITY(buf->tail);
 589 }
 590
 591 /** Release storage held by <b>buf</b>. */
 592 void
 593 buf_free(buf_t *buf)
 594 {
 595   if (!buf)
 596     return;
 597
 598   buf_clear(buf);
 599   buf->magic = 0xdeadbeef;
 600   tor_free(buf);
 601 }
 602
 603 /** Return a new copy of <b>in_chunk</b> */
 604 static chunk_t *
 605 chunk_copy(const chunk_t *in_chunk)
 606 {
 607   chunk_t *newch = tor_memdup(in_chunk, CHUNK_ALLOC_SIZE(in_chunk->memlen));
 608   total_bytes_allocated_in_chunks += CHUNK_ALLOC_SIZE(in_chunk->memlen);
 609 #ifdef DEBUG_CHUNK_ALLOC
 610   newch->DBG_alloc = CHUNK_ALLOC_SIZE(in_chunk->memlen);
 611 #endif
 612   newch->next = NULL;
 613   if (in_chunk->data) {
 614     off_t offset = in_chunk->data - in_chunk->mem;
 615     newch->data = newch->mem + offset;
 616   }
 617   return newch;
 618 }
 619
 620 /** Return a new copy of <b>buf</b> */
 621 buf_t *
 622 buf_copy(const buf_t *buf)
 623 {
 624   chunk_t *ch;
 625   buf_t *out = buf_new();
 626   out->default_chunk_size = buf->default_chunk_size;
 627   for (ch = buf->head; ch; ch = ch->next) {
 628     chunk_t *newch = chunk_copy(ch);
 629     if (out->tail) {
 630       out->tail->next = newch;
 631       out->tail = newch;
 632     } else {
 633       out->head = out->tail = newch;
 634     }
 635   }
 636   out->datalen = buf->datalen;
 637   return out;
 638 }
 639
 640 /** Append a new chunk with enough capacity to hold <b>capacity</b> bytes to
 641  * the tail of <b>buf</b>.  If <b>capped</b>, don't allocate a chunk bigger
 642  * than MAX_CHUNK_ALLOC. */
 643 static chunk_t *
 644 buf_add_chunk_with_capacity(buf_t *buf, size_t capacity, int capped)
 645 {
 646   chunk_t *chunk;
 647   struct timeval now;
 648   if (CHUNK_ALLOC_SIZE(capacity) < buf->default_chunk_size) {
 649     chunk = chunk_new_with_alloc_size(buf->default_chunk_size);
 650   } else if (capped && CHUNK_ALLOC_SIZE(capacity) > MAX_CHUNK_ALLOC) {
 651     chunk = chunk_new_with_alloc_size(MAX_CHUNK_ALLOC);
 652   } else {
 653     chunk = chunk_new_with_alloc_size(preferred_chunk_size(capacity));
 654   }
 655
 656   tor_gettimeofday_cached_monotonic(&now);
 657   chunk->inserted_time = (uint32_t)tv_to_msec(&now);
 658
 659   if (buf->tail) {
 660     tor_assert(buf->head);
 661     buf->tail->next = chunk;
 662     buf->tail = chunk;
 663   } else {
 664     tor_assert(!buf->head);
 665     buf->head = buf->tail = chunk;
 666   }
 667   check();
 668   return chunk;
 669 }
 670
 671 /** Return the age of the oldest chunk in the buffer <b>buf</b>, in
 672  * milliseconds.  Requires the current time, in truncated milliseconds since
 673  * the epoch, as its input <b>now</b>.
 674  */
 675 uint32_t
 676 buf_get_oldest_chunk_timestamp(const buf_t *buf, uint32_t now)
 677 {
 678   if (buf->head) {
 679     return now - buf->head->inserted_time;
 680   } else {
 681     return 0;
 682   }
 683 }
 684
 685 size_t
 686 buf_get_total_allocation(void)
 687 {
 688   return total_bytes_allocated_in_chunks;
 689 }
 690
 691 /** Read up to <b>at_most</b> bytes from the socket <b>fd</b> into
 692  * <b>chunk</b> (which must be on <b>buf</b>). If we get an EOF, set
 693  * *<b>reached_eof</b> to 1.  Return -1 on error, 0 on eof or blocking,
 694  * and the number of bytes read otherwise. */
 695 static INLINE int
 696 read_to_chunk(buf_t *buf, chunk_t *chunk, tor_socket_t fd, size_t at_most,
 697               int *reached_eof, int *socket_error)
 698 {
 699   ssize_t read_result;
 700   if (at_most > CHUNK_REMAINING_CAPACITY(chunk))
 701     at_most = CHUNK_REMAINING_CAPACITY(chunk);
 702   read_result = tor_socket_recv(fd, CHUNK_WRITE_PTR(chunk), at_most, 0);
 703
 704   if (read_result < 0) {
 705     int e = tor_socket_errno(fd);
 706     if (!ERRNO_IS_EAGAIN(e)) { /* it's a real error */
 707 #ifdef _WIN32
 708       if (e == WSAENOBUFS)
 709         log_warn(LD_NET,"recv() failed: WSAENOBUFS. Not enough ram?");
 710 #endif
 711       *socket_error = e;
 712       return -1;
 713     }
 714     return 0; /* would block. */
 715   } else if (read_result == 0) {
 716     log_debug(LD_NET,"Encountered eof on fd %d", (int)fd);
 717     *reached_eof = 1;
 718     return 0;
 719   } else { /* actually got bytes. */
 720     buf->datalen += read_result;
 721     chunk->datalen += read_result;
 722     log_debug(LD_NET,"Read %ld bytes. %d on inbuf.", (long)read_result,
 723               (int)buf->datalen);
 724     tor_assert(read_result < INT_MAX);
 725     return (int)read_result;
 726   }
 727 }
 728
 729 /** As read_to_chunk(), but return (negative) error code on error, blocking,
 730  * or TLS, and the number of bytes read otherwise. */
 731 static INLINE int
 732 read_to_chunk_tls(buf_t *buf, chunk_t *chunk, tor_tls_t *tls,
 733                   size_t at_most)
 734 {
 735   int read_result;
 736
 737   tor_assert(CHUNK_REMAINING_CAPACITY(chunk) >= at_most);
 738   read_result = tor_tls_read(tls, CHUNK_WRITE_PTR(chunk), at_most);
 739   if (read_result < 0)
 740     return read_result;
 741   buf->datalen += read_result;
 742   chunk->datalen += read_result;
 743   return read_result;
 744 }
 745
 746 /** Read from socket <b>s</b>, writing onto end of <b>buf</b>.  Read at most
 747  * <b>at_most</b> bytes, growing the buffer as necessary.  If recv() returns 0
 748  * (because of EOF), set *<b>reached_eof</b> to 1 and return 0. Return -1 on
 749  * error; else return the number of bytes read.
 750  */
 751 /* XXXX024 indicate "read blocked" somehow? */
 752 int
 753 read_to_buf(tor_socket_t s, size_t at_most, buf_t *buf, int *reached_eof,
 754             int *socket_error)
 755 {
 756   /* XXXX024 It's stupid to overload the return values for these functions:
 757    * "error status" and "number of bytes read" are not mutually exclusive.
 758    */
 759   int r = 0;
 760   size_t total_read = 0;
 761
 762   check();
 763   tor_assert(reached_eof);
 764   tor_assert(SOCKET_OK(s));
 765
 766   while (at_most > total_read) {
 767     size_t readlen = at_most - total_read;
 768     chunk_t *chunk;
 769     if (!buf->tail || CHUNK_REMAINING_CAPACITY(buf->tail) < MIN_READ_LEN) {
 770       chunk = buf_add_chunk_with_capacity(buf, at_most, 1);
 771       if (readlen > chunk->memlen)
 772         readlen = chunk->memlen;
 773     } else {
 774       size_t cap = CHUNK_REMAINING_CAPACITY(buf->tail);
 775       chunk = buf->tail;
 776       if (cap < readlen)
 777         readlen = cap;
 778     }
 779
 780     r = read_to_chunk(buf, chunk, s, readlen, reached_eof, socket_error);
 781     check();
 782     if (r < 0)
 783       return r; /* Error */
 784     tor_assert(total_read+r < INT_MAX);
 785     total_read += r;
 786     if ((size_t)r < readlen) { /* eof, block, or no more to read. */
 787       break;
 788     }
 789   }
 790   return (int)total_read;
 791 }
 792
 793 /** As read_to_buf, but reads from a TLS connection, and returns a TLS
 794  * status value rather than the number of bytes read.
 795  *
 796  * Using TLS on OR connections complicates matters in two ways.
 797  *
 798  * First, a TLS stream has its own read buffer independent of the
 799  * connection's read buffer.  (TLS needs to read an entire frame from
 800  * the network before it can decrypt any data.  Thus, trying to read 1
 801  * byte from TLS can require that several KB be read from the network
 802  * and decrypted.  The extra data is stored in TLS's decrypt buffer.)
 803  * Because the data hasn't been read by Tor (it's still inside the TLS),
 804  * this means that sometimes a connection "has stuff to read" even when
 805  * poll() didn't return POLLIN. The tor_tls_get_pending_bytes function is
 806  * used in connection.c to detect TLS objects with non-empty internal
 807  * buffers and read from them again.
 808  *
 809  * Second, the TLS stream's events do not correspond directly to network
 810  * events: sometimes, before a TLS stream can read, the network must be
 811  * ready to write -- or vice versa.
 812  */
 813 int
 814 read_to_buf_tls(tor_tls_t *tls, size_t at_most, buf_t *buf)
 815 {
 816   int r = 0;
 817   size_t total_read = 0;
 818
 819   check_no_tls_errors();
 820
 821   check();
 822
 823   while (at_most > total_read) {
 824     size_t readlen = at_most - total_read;
 825     chunk_t *chunk;
 826     if (!buf->tail || CHUNK_REMAINING_CAPACITY(buf->tail) < MIN_READ_LEN) {
 827       chunk = buf_add_chunk_with_capacity(buf, at_most, 1);
 828       if (readlen > chunk->memlen)
 829         readlen = chunk->memlen;
 830     } else {
 831       size_t cap = CHUNK_REMAINING_CAPACITY(buf->tail);
 832       chunk = buf->tail;
 833       if (cap < readlen)
 834         readlen = cap;
 835     }
 836
 837     r = read_to_chunk_tls(buf, chunk, tls, readlen);
 838     check();
 839     if (r < 0)
 840       return r; /* Error */
 841     tor_assert(total_read+r < INT_MAX);
 842      total_read += r;
 843     if ((size_t)r < readlen) /* eof, block, or no more to read. */
 844       break;
 845   }
 846   return (int)total_read;
 847 }
 848
 849 /** Helper for flush_buf(): try to write <b>sz</b> bytes from chunk
 850  * <b>chunk</b> of buffer <b>buf</b> onto socket <b>s</b>.  On success, deduct
 851  * the bytes written from *<b>buf_flushlen</b>.  Return the number of bytes
 852  * written on success, 0 on blocking, -1 on failure.
 853  */
 854 static INLINE int
 855 flush_chunk(tor_socket_t s, buf_t *buf, chunk_t *chunk, size_t sz,
 856             size_t *buf_flushlen)
 857 {
 858   ssize_t write_result;
 859
 860   if (sz > chunk->datalen)
 861     sz = chunk->datalen;
 862   write_result = tor_socket_send(s, chunk->data, sz, 0);
 863
 864   if (write_result < 0) {
 865     int e = tor_socket_errno(s);
 866     if (!ERRNO_IS_EAGAIN(e)) { /* it's a real error */
 867 #ifdef _WIN32
 868       if (e == WSAENOBUFS)
 869         log_warn(LD_NET,"write() failed: WSAENOBUFS. Not enough ram?");
 870 #endif
 871       return -1;
 872     }
 873     log_debug(LD_NET,"write() would block, returning.");
 874     return 0;
 875   } else {
 876     *buf_flushlen -= write_result;
 877     buf_remove_from_front(buf, write_result);
 878     tor_assert(write_result < INT_MAX);
 879     return (int)write_result;
 880   }
 881 }
 882
 883 /** Helper for flush_buf_tls(): try to write <b>sz</b> bytes from chunk
 884  * <b>chunk</b> of buffer <b>buf</b> onto socket <b>s</b>.  (Tries to write
 885  * more if there is a forced pending write size.)  On success, deduct the
 886  * bytes written from *<b>buf_flushlen</b>.  Return the number of bytes
 887  * written on success, and a TOR_TLS error code on failure or blocking.
 888  */
 889 static INLINE int
 890 flush_chunk_tls(tor_tls_t *tls, buf_t *buf, chunk_t *chunk,
 891                 size_t sz, size_t *buf_flushlen)
 892 {
 893   int r;
 894   size_t forced;
 895   char *data;
 896
 897   forced = tor_tls_get_forced_write_size(tls);
 898   if (forced > sz)
 899     sz = forced;
 900   if (chunk) {
 901     data = chunk->data;
 902     tor_assert(sz <= chunk->datalen);
 903   } else {
 904     data = NULL;
 905     tor_assert(sz == 0);
 906   }
 907   r = tor_tls_write(tls, data, sz);
 908   if (r < 0)
 909     return r;
 910   if (*buf_flushlen > (size_t)r)
 911     *buf_flushlen -= r;
 912   else
 913     *buf_flushlen = 0;
 914   buf_remove_from_front(buf, r);
 915   log_debug(LD_NET,"flushed %d bytes, %d ready to flush, %d remain.",
 916             r,(int)*buf_flushlen,(int)buf->datalen);
 917   return r;
 918 }
 919
 920 /** Write data from <b>buf</b> to the socket <b>s</b>.  Write at most
 921  * <b>sz</b> bytes, decrement *<b>buf_flushlen</b> by
 922  * the number of bytes actually written, and remove the written bytes
 923  * from the buffer.  Return the number of bytes written on success,
 924  * -1 on failure.  Return 0 if write() would block.
 925  */
 926 int
 927 flush_buf(tor_socket_t s, buf_t *buf, size_t sz, size_t *buf_flushlen)
 928 {
 929   /* XXXX024 It's stupid to overload the return values for these functions:
 930    * "error status" and "number of bytes flushed" are not mutually exclusive.
 931    */
 932   int r;
 933   size_t flushed = 0;
 934   tor_assert(buf_flushlen);
 935   tor_assert(SOCKET_OK(s));
 936   tor_assert(*buf_flushlen <= buf->datalen);
 937   tor_assert(sz <= *buf_flushlen);
 938
 939   check();
 940   while (sz) {
 941     size_t flushlen0;
 942     tor_assert(buf->head);
 943     if (buf->head->datalen >= sz)
 944       flushlen0 = sz;
 945     else
 946       flushlen0 = buf->head->datalen;
 947
 948     r = flush_chunk(s, buf, buf->head, flushlen0, buf_flushlen);
 949     check();
 950     if (r < 0)
 951       return r;
 952     flushed += r;
 953     sz -= r;
 954     if (r == 0 || (size_t)r < flushlen0) /* can't flush any more now. */
 955       break;
 956   }
 957   tor_assert(flushed < INT_MAX);
 958   return (int)flushed;
 959 }
 960
 961 /** As flush_buf(), but writes data to a TLS connection.  Can write more than
 962  * <b>flushlen</b> bytes.
 963  */
 964 int
 965 flush_buf_tls(tor_tls_t *tls, buf_t *buf, size_t flushlen,
 966               size_t *buf_flushlen)
 967 {
 968   int r;
 969   size_t flushed = 0;
 970   ssize_t sz;
 971   tor_assert(buf_flushlen);
 972   tor_assert(*buf_flushlen <= buf->datalen);
 973   tor_assert(flushlen <= *buf_flushlen);
 974   sz = (ssize_t) flushlen;
 975
 976   /* we want to let tls write even if flushlen is zero, because it might
 977    * have a partial record pending */
 978   check_no_tls_errors();
 979
 980   check();
 981   do {
 982     size_t flushlen0;
 983     if (buf->head) {
 984       if ((ssize_t)buf->head->datalen >= sz)
 985         flushlen0 = sz;
 986       else
 987         flushlen0 = buf->head->datalen;
 988     } else {
 989       flushlen0 = 0;
 990     }
 991
 992     r = flush_chunk_tls(tls, buf, buf->head, flushlen0, buf_flushlen);
 993     check();
 994     if (r < 0)
 995       return r;
 996     flushed += r;
 997     sz -= r;
 998     if (r == 0) /* Can't flush any more now. */
 999       break;
1000   } while (sz > 0);
1001   tor_assert(flushed < INT_MAX);
1002   return (int)flushed;
1003 }
1004
1005 /** Append <b>string_len</b> bytes from <b>string</b> to the end of
1006  * <b>buf</b>.
1007  *
1008  * Return the new length of the buffer on success, -1 on failure.
1009  */
1010 int
1011 write_to_buf(const char *string, size_t string_len, buf_t *buf)
1012 {
1013   if (!string_len)
1014     return (int)buf->datalen;
1015   check();
1016
1017   while (string_len) {
1018     size_t copy;
1019     if (!buf->tail || !CHUNK_REMAINING_CAPACITY(buf->tail))
1020       buf_add_chunk_with_capacity(buf, string_len, 1);
1021
1022     copy = CHUNK_REMAINING_CAPACITY(buf->tail);
1023     if (copy > string_len)
1024       copy = string_len;
1025     memcpy(CHUNK_WRITE_PTR(buf->tail), string, copy);
1026     string_len -= copy;
1027     string += copy;
1028     buf->datalen += copy;
1029     buf->tail->datalen += copy;
1030   }
1031
1032   check();
1033   tor_assert(buf->datalen < INT_MAX);
1034   return (int)buf->datalen;
1035 }
1036
1037 /** Helper: copy the first <b>string_len</b> bytes from <b>buf</b>
1038  * onto <b>string</b>.
1039  */
1040 static INLINE void
1041 peek_from_buf(char *string, size_t string_len, const buf_t *buf)
1042 {
1043   chunk_t *chunk;
1044
1045   tor_assert(string);
1046   /* make sure we don't ask for too much */
1047   tor_assert(string_len <= buf->datalen);
1048   /* assert_buf_ok(buf); */
1049
1050   chunk = buf->head;
1051   while (string_len) {
1052     size_t copy = string_len;
1053     tor_assert(chunk);
1054     if (chunk->datalen < copy)
1055       copy = chunk->datalen;
1056     memcpy(string, chunk->data, copy);
1057     string_len -= copy;
1058     string += copy;
1059     chunk = chunk->next;
1060   }
1061 }
1062
1063 /** Remove <b>string_len</b> bytes from the front of <b>buf</b>, and store
1064  * them into <b>string</b>.  Return the new buffer size.  <b>string_len</b>
1065  * must be \<= the number of bytes on the buffer.
1066  */
1067 int
1068 fetch_from_buf(char *string, size_t string_len, buf_t *buf)
1069 {
1070   /* There must be string_len bytes in buf; write them onto string,
1071    * then memmove buf back (that is, remove them from buf).
1072    *
1073    * Return the number of bytes still on the buffer. */
1074
1075   check();
1076   peek_from_buf(string, string_len, buf);
1077   buf_remove_from_front(buf, string_len);
1078   check();
1079   tor_assert(buf->datalen < INT_MAX);
1080   return (int)buf->datalen;
1081 }
1082
1083 /** True iff the cell command <b>command</b> is one that implies a
1084  * variable-length cell in Tor link protocol <b>linkproto</b>. */
1085 static INLINE int
1086 cell_command_is_var_length(uint8_t command, int linkproto)
1087 {
1088   /* If linkproto is v2 (2), CELL_VERSIONS is the only variable-length cells
1089    * work as implemented here. If it's 1, there are no variable-length cells.
1090    * Tor does not support other versions right now, and so can't negotiate
1091    * them.
1092    */
1093   switch (linkproto) {
1094   case 1:
1095     /* Link protocol version 1 has no variable-length cells. */
1096     return 0;
1097   case 2:
1098     /* In link protocol version 2, VERSIONS is the only variable-length cell */
1099     return command == CELL_VERSIONS;
1100   case 0:
1101   case 3:
1102   default:
1103     /* In link protocol version 3 and later, and in version "unknown",
1104      * commands 128 and higher indicate variable-length. VERSIONS is
1105      * grandfathered in. */
1106     return command == CELL_VERSIONS || command >= 128;
1107   }
1108 }
1109
1110 /** Check <b>buf</b> for a variable-length cell according to the rules of link
1111  * protocol version <b>linkproto</b>.  If one is found, pull it off the buffer
1112  * and assign a newly allocated var_cell_t to *<b>out</b>, and return 1.
1113  * Return 0 if whatever is on the start of buf_t is not a variable-length
1114  * cell.  Return 1 and set *<b>out</b> to NULL if there seems to be the start
1115  * of a variable-length cell on <b>buf</b>, but the whole thing isn't there
1116  * yet. */
1117 int
1118 fetch_var_cell_from_buf(buf_t *buf, var_cell_t **out, int linkproto)
1119 {
1120   char hdr[VAR_CELL_MAX_HEADER_SIZE];
1121   var_cell_t *result;
1122   uint8_t command;
1123   uint16_t length;
1124   const int wide_circ_ids = linkproto >= MIN_LINK_PROTO_FOR_WIDE_CIRC_IDS;
1125   const int circ_id_len = get_circ_id_size(wide_circ_ids);
1126   const unsigned header_len = get_var_cell_header_size(wide_circ_ids);
1127   check();
1128   *out = NULL;
1129   if (buf->datalen < header_len)
1130     return 0;
1131   peek_from_buf(hdr, header_len, buf);
1132
1133   command = get_uint8(hdr + circ_id_len);
1134   if (!(cell_command_is_var_length(command, linkproto)))
1135     return 0;
1136
1137   length = ntohs(get_uint16(hdr + circ_id_len + 1));
1138   if (buf->datalen < (size_t)(header_len+length))
1139     return 1;
1140   result = var_cell_new(length);
1141   result->command = command;
1142   if (wide_circ_ids)
1143     result->circ_id = ntohl(get_uint32(hdr));
1144   else
1145     result->circ_id = ntohs(get_uint16(hdr));
1146
1147   buf_remove_from_front(buf, header_len);
1148   peek_from_buf((char*) result->payload, length, buf);
1149   buf_remove_from_front(buf, length);
1150   check();
1151
1152   *out = result;
1153   return 1;
1154 }
1155
1156 #ifdef USE_BUFFEREVENTS
1157 /** Try to read <b>n</b> bytes from <b>buf</b> at <b>pos</b> (which may be
1158  * NULL for the start of the buffer), copying the data only if necessary.  Set
1159  * *<b>data_out</b> to a pointer to the desired bytes.  Set <b>free_out</b>
1160  * to 1 if we needed to malloc *<b>data</b> because the original bytes were
1161  * noncontiguous; 0 otherwise.  Return the number of bytes actually available
1162  * at *<b>data_out</b>.
1163  */
1164 static ssize_t
1165 inspect_evbuffer(struct evbuffer *buf, char **data_out, size_t n,
1166                  int *free_out, struct evbuffer_ptr *pos)
1167 {
1168   int n_vecs, i;
1169
1170   if (evbuffer_get_length(buf) < n)
1171     n = evbuffer_get_length(buf);
1172   if (n == 0)
1173     return 0;
1174   n_vecs = evbuffer_peek(buf, n, pos, NULL, 0);
1175   tor_assert(n_vecs > 0);
1176   if (n_vecs == 1) {
1177     struct evbuffer_iovec v;
1178     i = evbuffer_peek(buf, n, pos, &v, 1);
1179     tor_assert(i == 1);
1180     *data_out = v.iov_base;
1181     *free_out = 0;
1182     return v.iov_len;
1183   } else {
1184     ev_ssize_t copied;
1185     *data_out = tor_malloc(n);
1186     *free_out = 1;
1187     copied = evbuffer_copyout(buf, *data_out, n);
1188     tor_assert(copied >= 0 && (size_t)copied == n);
1189     return copied;
1190   }
1191 }
1192
1193 /** As fetch_var_cell_from_buf, buf works on an evbuffer. */
1194 int
1195 fetch_var_cell_from_evbuffer(struct evbuffer *buf, var_cell_t **out,
1196                              int linkproto)
1197 {
1198   char *hdr = NULL;
1199   int free_hdr = 0;
1200   size_t n;
1201   size_t buf_len;
1202   uint8_t command;
1203   uint16_t cell_length;
1204   var_cell_t *cell;
1205   int result = 0;
1206   const int wide_circ_ids = linkproto >= MIN_LINK_PROTO_FOR_WIDE_CIRC_IDS;
1207   const int circ_id_len = get_circ_id_size(wide_circ_ids);
1208   const unsigned header_len = get_var_cell_header_size(wide_circ_ids);
1209
1210   *out = NULL;
1211   buf_len = evbuffer_get_length(buf);
1212   if (buf_len < header_len)
1213     return 0;
1214
1215   n = inspect_evbuffer(buf, &hdr, header_len, &free_hdr, NULL);
1216   tor_assert(n >= header_len);
1217
1218   command = get_uint8(hdr + circ_id_len);
1219   if (!(cell_command_is_var_length(command, linkproto))) {
1220     goto done;
1221   }
1222
1223   cell_length = ntohs(get_uint16(hdr + circ_id_len + 1));
1224   if (buf_len < (size_t)(header_len+cell_length)) {
1225     result = 1; /* Not all here yet. */
1226     goto done;
1227   }
1228
1229   cell = var_cell_new(cell_length);
1230   cell->command = command;
1231   if (wide_circ_ids)
1232     cell->circ_id = ntohl(get_uint32(hdr));
1233   else
1234     cell->circ_id = ntohs(get_uint16(hdr));
1235   evbuffer_drain(buf, header_len);
1236   evbuffer_remove(buf, cell->payload, cell_length);
1237   *out = cell;
1238   result = 1;
1239
1240  done:
1241   if (free_hdr && hdr)
1242     tor_free(hdr);
1243   return result;
1244 }
1245 #endif
1246
1247 /** Move up to *<b>buf_flushlen</b> bytes from <b>buf_in</b> to
1248  * <b>buf_out</b>, and modify *<b>buf_flushlen</b> appropriately.
1249  * Return the number of bytes actually copied.
1250  */
1251 int
1252 move_buf_to_buf(buf_t *buf_out, buf_t *buf_in, size_t *buf_flushlen)
1253 {
1254   /* We can do way better here, but this doesn't turn up in any profiles. */
1255   char b[4096];
1256   size_t cp, len;
1257   len = *buf_flushlen;
1258   if (len > buf_in->datalen)
1259     len = buf_in->datalen;
1260
1261   cp = len; /* Remember the number of bytes we intend to copy. */
1262   tor_assert(cp < INT_MAX);
1263   while (len) {
1264     /* This isn't the most efficient implementation one could imagine, since
1265      * it does two copies instead of 1, but I kinda doubt that this will be
1266      * critical path. */
1267     size_t n = len > sizeof(b) ? sizeof(b) : len;
1268     fetch_from_buf(b, n, buf_in);
1269     write_to_buf(b, n, buf_out);
1270     len -= n;
1271   }
1272   *buf_flushlen -= cp;
1273   return (int)cp;
1274 }
1275
1276 /** Internal structure: represents a position in a buffer. */
1277 typedef struct buf_pos_t {
1278   const chunk_t *chunk; /**< Which chunk are we pointing to? */
1279   int pos;/**< Which character inside the chunk's data are we pointing to? */
1280   size_t chunk_pos; /**< Total length of all previous chunks. */
1281 } buf_pos_t;
1282
1283 /** Initialize <b>out</b> to point to the first character of <b>buf</b>.*/
1284 static void
1285 buf_pos_init(const buf_t *buf, buf_pos_t *out)
1286 {
1287   out->chunk = buf->head;
1288   out->pos = 0;
1289   out->chunk_pos = 0;
1290 }
1291
1292 /** Advance <b>out</b> to the first appearance of <b>ch</b> at the current
1293  * position of <b>out</b>, or later.  Return -1 if no instances are found;
1294  * otherwise returns the absolute position of the character. */
1295 static off_t
1296 buf_find_pos_of_char(char ch, buf_pos_t *out)
1297 {
1298   const chunk_t *chunk;
1299   int pos;
1300   tor_assert(out);
1301   if (out->chunk) {
1302     if (out->chunk->datalen) {
1303       tor_assert(out->pos < (off_t)out->chunk->datalen);
1304     } else {
1305       tor_assert(out->pos == 0);
1306     }
1307   }
1308   pos = out->pos;
1309   for (chunk = out->chunk; chunk; chunk = chunk->next) {
1310     char *cp = memchr(chunk->data+pos, ch, chunk->datalen - pos);
1311     if (cp) {
1312       out->chunk = chunk;
1313       tor_assert(cp - chunk->data < INT_MAX);
1314       out->pos = (int)(cp - chunk->data);
1315       return out->chunk_pos + out->pos;
1316     } else {
1317       out->chunk_pos += chunk->datalen;
1318       pos = 0;
1319     }
1320   }
1321   return -1;
1322 }
1323
1324 /** Advance <b>pos</b> by a single character, if there are any more characters
1325  * in the buffer.  Returns 0 on success, -1 on failure. */
1326 static INLINE int
1327 buf_pos_inc(buf_pos_t *pos)
1328 {
1329   ++pos->pos;
1330   if (pos->pos == (off_t)pos->chunk->datalen) {
1331     if (!pos->chunk->next)
1332       return -1;
1333     pos->chunk_pos += pos->chunk->datalen;
1334     pos->chunk = pos->chunk->next;
1335     pos->pos = 0;
1336   }
1337   return 0;
1338 }
1339
1340 /** Return true iff the <b>n</b>-character string in <b>s</b> appears
1341  * (verbatim) at <b>pos</b>. */
1342 static int
1343 buf_matches_at_pos(const buf_pos_t *pos, const char *s, size_t n)
1344 {
1345   buf_pos_t p;
1346   if (!n)
1347     return 1;
1348
1349   memcpy(&p, pos, sizeof(p));
1350
1351   while (1) {
1352     char ch = p.chunk->data[p.pos];
1353     if (ch != *s)
1354       return 0;
1355     ++s;
1356     /* If we're out of characters that don't match, we match.  Check this
1357      * _before_ we test incrementing pos, in case we're at the end of the
1358      * string. */
1359     if (--n == 0)
1360       return 1;
1361     if (buf_pos_inc(&p)<0)
1362       return 0;
1363   }
1364 }
1365
1366 /** Return the first position in <b>buf</b> at which the <b>n</b>-character
1367  * string <b>s</b> occurs, or -1 if it does not occur. */
1368 STATIC int
1369 buf_find_string_offset(const buf_t *buf, const char *s, size_t n)
1370 {
1371   buf_pos_t pos;
1372   buf_pos_init(buf, &pos);
1373   while (buf_find_pos_of_char(*s, &pos) >= 0) {
1374     if (buf_matches_at_pos(&pos, s, n)) {
1375       tor_assert(pos.chunk_pos + pos.pos < INT_MAX);
1376       return (int)(pos.chunk_pos + pos.pos);
1377     } else {
1378       if (buf_pos_inc(&pos)<0)
1379         return -1;
1380     }
1381   }
1382   return -1;
1383 }
1384
1385 /** There is a (possibly incomplete) http statement on <b>buf</b>, of the
1386  * form "\%s\\r\\n\\r\\n\%s", headers, body. (body may contain NULs.)
1387  * If a) the headers include a Content-Length field and all bytes in
1388  * the body are present, or b) there's no Content-Length field and
1389  * all headers are present, then:
1390  *
1391  *  - strdup headers into <b>*headers_out</b>, and NUL-terminate it.
1392  *  - memdup body into <b>*body_out</b>, and NUL-terminate it.
1393  *  - Then remove them from <b>buf</b>, and return 1.
1394  *
1395  *  - If headers or body is NULL, discard that part of the buf.
1396  *  - If a headers or body doesn't fit in the arg, return -1.
1397  *  (We ensure that the headers or body don't exceed max len,
1398  *   _even if_ we're planning to discard them.)
1399  *  - If force_complete is true, then succeed even if not all of the
1400  *    content has arrived.
1401  *
1402  * Else, change nothing and return 0.
1403  */
1404 int
1405 fetch_from_buf_http(buf_t *buf,
1406                     char **headers_out, size_t max_headerlen,
1407                     char **body_out, size_t *body_used, size_t max_bodylen,
1408                     int force_complete)
1409 {
1410   char *headers, *p;
1411   size_t headerlen, bodylen, contentlen;
1412   int crlf_offset;
1413
1414   check();
1415   if (!buf->head)
1416     return 0;
1417
1418   crlf_offset = buf_find_string_offset(buf, "\r\n\r\n", 4);
1419   if (crlf_offset > (int)max_headerlen ||
1420       (crlf_offset < 0 && buf->datalen > max_headerlen)) {
1421     log_debug(LD_HTTP,"headers too long.");
1422     return -1;
1423   } else if (crlf_offset < 0) {
1424     log_debug(LD_HTTP,"headers not all here yet.");
1425     return 0;
1426   }
1427   /* Okay, we have a full header.  Make sure it all appears in the first
1428    * chunk. */
1429   if ((int)buf->head->datalen < crlf_offset + 4)
1430     buf_pullup(buf, crlf_offset+4, 0);
1431   headerlen = crlf_offset + 4;
1432
1433   headers = buf->head->data;
1434   bodylen = buf->datalen - headerlen;
1435   log_debug(LD_HTTP,"headerlen %d, bodylen %d.", (int)headerlen, (int)bodylen);
1436
1437   if (max_headerlen <= headerlen) {
1438     log_warn(LD_HTTP,"headerlen %d larger than %d. Failing.",
1439              (int)headerlen, (int)max_headerlen-1);
1440     return -1;
1441   }
1442   if (max_bodylen <= bodylen) {
1443     log_warn(LD_HTTP,"bodylen %d larger than %d. Failing.",
1444              (int)bodylen, (int)max_bodylen-1);
1445     return -1;
1446   }
1447
1448 #define CONTENT_LENGTH "\r\nContent-Length: "
1449   p = (char*) tor_memstr(headers, headerlen, CONTENT_LENGTH);
1450   if (p) {
1451     int i;
1452     i = atoi(p+strlen(CONTENT_LENGTH));
1453     if (i < 0) {
1454       log_warn(LD_PROTOCOL, "Content-Length is less than zero; it looks like "
1455                "someone is trying to crash us.");
1456       return -1;
1457     }
1458     contentlen = i;
1459     /* if content-length is malformed, then our body length is 0. fine. */
1460     log_debug(LD_HTTP,"Got a contentlen of %d.",(int)contentlen);
1461     if (bodylen < contentlen) {
1462       if (!force_complete) {
1463         log_debug(LD_HTTP,"body not all here yet.");
1464         return 0; /* not all there yet */
1465       }
1466     }
1467     if (bodylen > contentlen) {
1468       bodylen = contentlen;
1469       log_debug(LD_HTTP,"bodylen reduced to %d.",(int)bodylen);
1470     }
1471   }
1472   /* all happy. copy into the appropriate places, and return 1 */
1473   if (headers_out) {
1474     *headers_out = tor_malloc(headerlen+1);
1475     fetch_from_buf(*headers_out, headerlen, buf);
1476     (*headers_out)[headerlen] = 0; /* NUL terminate it */
1477   }
1478   if (body_out) {
1479     tor_assert(body_used);
1480     *body_used = bodylen;
1481     *body_out = tor_malloc(bodylen+1);
1482     fetch_from_buf(*body_out, bodylen, buf);
1483     (*body_out)[bodylen] = 0; /* NUL terminate it */
1484   }
1485   check();
1486   return 1;
1487 }
1488
1489 #ifdef USE_BUFFEREVENTS
1490 /** As fetch_from_buf_http, buf works on an evbuffer. */
1491 int
1492 fetch_from_evbuffer_http(struct evbuffer *buf,
1493                     char **headers_out, size_t max_headerlen,
1494                     char **body_out, size_t *body_used, size_t max_bodylen,
1495                     int force_complete)
1496 {
1497   struct evbuffer_ptr crlf, content_length;
1498   size_t headerlen, bodylen, contentlen;
1499
1500   /* Find the first \r\n\r\n in the buffer */
1501   crlf = evbuffer_search(buf, "\r\n\r\n", 4, NULL);
1502   if (crlf.pos < 0) {
1503     /* We didn't find one. */
1504     if (evbuffer_get_length(buf) > max_headerlen)
1505       return -1; /* Headers too long. */
1506     return 0; /* Headers not here yet. */
1507   } else if (crlf.pos > (int)max_headerlen) {
1508     return -1; /* Headers too long. */
1509   }
1510
1511   headerlen = crlf.pos + 4;  /* Skip over the \r\n\r\n */
1512   bodylen = evbuffer_get_length(buf) - headerlen;
1513   if (bodylen > max_bodylen)
1514     return -1; /* body too long */
1515
1516   /* Look for the first occurrence of CONTENT_LENGTH insize buf before the
1517    * crlfcrlf */
1518   content_length = evbuffer_search_range(buf, CONTENT_LENGTH,
1519                                          strlen(CONTENT_LENGTH), NULL, &crlf);
1520
1521   if (content_length.pos >= 0) {
1522     /* We found a content_length: parse it and figure out if the body is here
1523      * yet. */
1524     struct evbuffer_ptr eol;
1525     char *data = NULL;
1526     int free_data = 0;
1527     int n, i;
1528     n = evbuffer_ptr_set(buf, &content_length, strlen(CONTENT_LENGTH),
1529                          EVBUFFER_PTR_ADD);
1530     tor_assert(n == 0);
1531     eol = evbuffer_search_eol(buf, &content_length, NULL, EVBUFFER_EOL_CRLF);
1532     tor_assert(eol.pos > content_length.pos);
1533     tor_assert(eol.pos <= crlf.pos);
1534     inspect_evbuffer(buf, &data, eol.pos - content_length.pos, &free_data,
1535                          &content_length);
1536
1537     i = atoi(data);
1538     if (free_data)
1539       tor_free(data);
1540     if (i < 0) {
1541       log_warn(LD_PROTOCOL, "Content-Length is less than zero; it looks like "
1542                "someone is trying to crash us.");
1543       return -1;
1544     }
1545     contentlen = i;
1546     /* if content-length is malformed, then our body length is 0. fine. */
1547     log_debug(LD_HTTP,"Got a contentlen of %d.",(int)contentlen);
1548     if (bodylen < contentlen) {
1549       if (!force_complete) {
1550         log_debug(LD_HTTP,"body not all here yet.");
1551         return 0; /* not all there yet */
1552       }
1553     }
1554     if (bodylen > contentlen) {
1555       bodylen = contentlen;
1556       log_debug(LD_HTTP,"bodylen reduced to %d.",(int)bodylen);
1557     }
1558   }
1559
1560   if (headers_out) {
1561     *headers_out = tor_malloc(headerlen+1);
1562     evbuffer_remove(buf, *headers_out, headerlen);
1563     (*headers_out)[headerlen] = '\0';
1564   }
1565   if (body_out) {
1566     tor_assert(headers_out);
1567     tor_assert(body_used);
1568     *body_used = bodylen;
1569     *body_out = tor_malloc(bodylen+1);
1570     evbuffer_remove(buf, *body_out, bodylen);
1571     (*body_out)[bodylen] = '\0';
1572   }
1573   return 1;
1574 }
1575 #endif
1576
1577 /**
1578  * Wait this many seconds before warning the user about using SOCKS unsafely
1579  * again (requires that WarnUnsafeSocks is turned on). */
1580 #define SOCKS_WARN_INTERVAL 5
1581
1582 /** Warn that the user application has made an unsafe socks request using
1583  * protocol <b>socks_protocol</b> on port <b>port</b>.  Don't warn more than
1584  * once per SOCKS_WARN_INTERVAL, unless <b>safe_socks</b> is set. */
1585 static void
1586 log_unsafe_socks_warning(int socks_protocol, const char *address,
1587                          uint16_t port, int safe_socks)
1588 {
1589   static ratelim_t socks_ratelim = RATELIM_INIT(SOCKS_WARN_INTERVAL);
1590
1591   const or_options_t *options = get_options();
1592   if (! options->WarnUnsafeSocks)
1593     return;
1594   if (safe_socks) {
1595     log_fn_ratelim(&socks_ratelim, LOG_WARN, LD_APP,
1596              "Your application (using socks%d to port %d) is giving "
1597              "Tor only an IP address. Applications that do DNS resolves "
1598              "themselves may leak information. Consider using Socks4A "
1599              "(e.g. via privoxy or socat) instead. For more information, "
1600              "please see https://wiki.torproject.org/TheOnionRouter/"
1601              "TorFAQ#SOCKSAndDNS.%s",
1602              socks_protocol,
1603              (int)port,
1604              safe_socks ? " Rejecting." : "");
1605   }
1606   control_event_client_status(LOG_WARN,
1607                               "DANGEROUS_SOCKS PROTOCOL=SOCKS%d ADDRESS=%s:%d",
1608                               socks_protocol, address, (int)port);
1609 }
1610
1611 /** Do not attempt to parse socks messages longer than this.  This value is
1612  * actually significantly higher than the longest possible socks message. */
1613 #define MAX_SOCKS_MESSAGE_LEN 512
1614
1615 /** Return a new socks_request_t. */
1616 socks_request_t *
1617 socks_request_new(void)
1618 {
1619   return tor_malloc_zero(sizeof(socks_request_t));
1620 }
1621
1622 /** Free all storage held in the socks_request_t <b>req</b>. */
1623 void
1624 socks_request_free(socks_request_t *req)
1625 {
1626   if (!req)
1627     return;
1628   if (req->username) {
1629     memwipe(req->username, 0x10, req->usernamelen);
1630     tor_free(req->username);
1631   }
1632   if (req->password) {
1633     memwipe(req->password, 0x04, req->passwordlen);
1634     tor_free(req->password);
1635   }
1636   memwipe(req, 0xCC, sizeof(socks_request_t));
1637   tor_free(req);
1638 }
1639
1640 /** There is a (possibly incomplete) socks handshake on <b>buf</b>, of one
1641  * of the forms
1642  *  - socks4: "socksheader username\\0"
1643  *  - socks4a: "socksheader username\\0 destaddr\\0"
1644  *  - socks5 phase one: "version #methods methods"
1645  *  - socks5 phase two: "version command 0 addresstype..."
1646  * If it's a complete and valid handshake, and destaddr fits in
1647  *   MAX_SOCKS_ADDR_LEN bytes, then pull the handshake off the buf,
1648  *   assign to <b>req</b>, and return 1.
1649  *
1650  * If it's invalid or too big, return -1.
1651  *
1652  * Else it's not all there yet, leave buf alone and return 0.
1653  *
1654  * If you want to specify the socks reply, write it into <b>req->reply</b>
1655  *   and set <b>req->replylen</b>, else leave <b>req->replylen</b> alone.
1656  *
1657  * If <b>log_sockstype</b> is non-zero, then do a notice-level log of whether
1658  * the connection is possibly leaking DNS requests locally or not.
1659  *
1660  * If <b>safe_socks</b> is true, then reject unsafe socks protocols.
1661  *
1662  * If returning 0 or -1, <b>req->address</b> and <b>req->port</b> are
1663  * undefined.
1664  */
1665 int
1666 fetch_from_buf_socks(buf_t *buf, socks_request_t *req,
1667                      int log_sockstype, int safe_socks)
1668 {
1669   int res;
1670   ssize_t n_drain;
1671   size_t want_length = 128;
1672
1673   if (buf->datalen < 2) /* version and another byte */
1674     return 0;
1675
1676   do {
1677     n_drain = 0;
1678     buf_pullup(buf, want_length, 0);
1679     tor_assert(buf->head && buf->head->datalen >= 2);
1680     want_length = 0;
1681
1682     res = parse_socks(buf->head->data, buf->head->datalen, req, log_sockstype,
1683                       safe_socks, &n_drain, &want_length);
1684
1685     if (n_drain < 0)
1686       buf_clear(buf);
1687     else if (n_drain > 0)
1688       buf_remove_from_front(buf, n_drain);
1689
1690   } while (res == 0 && buf->head && want_length < buf->datalen &&
1691            buf->datalen >= 2);
1692
1693   return res;
1694 }
1695
1696 #ifdef USE_BUFFEREVENTS
1697 /* As fetch_from_buf_socks(), but targets an evbuffer instead. */
1698 int
1699 fetch_from_evbuffer_socks(struct evbuffer *buf, socks_request_t *req,
1700                           int log_sockstype, int safe_socks)
1701 {
1702   char *data;
1703   ssize_t n_drain;
1704   size_t datalen, buflen, want_length;
1705   int res;
1706
1707   buflen = evbuffer_get_length(buf);
1708   if (buflen < 2)
1709     return 0;
1710
1711   {
1712     /* See if we can find the socks request in the first chunk of the buffer.
1713      */
1714     struct evbuffer_iovec v;
1715     int i;
1716     n_drain = 0;
1717     i = evbuffer_peek(buf, -1, NULL, &v, 1);
1718     tor_assert(i == 1);
1719     data = v.iov_base;
1720     datalen = v.iov_len;
1721     want_length = 0;
1722
1723     res = parse_socks(data, datalen, req, log_sockstype,
1724                       safe_socks, &n_drain, &want_length);
1725
1726     if (n_drain < 0)
1727       evbuffer_drain(buf, evbuffer_get_length(buf));
1728     else if (n_drain > 0)
1729       evbuffer_drain(buf, n_drain);
1730
1731     if (res)
1732       return res;
1733   }
1734
1735   /* Okay, the first chunk of the buffer didn't have a complete socks request.
1736    * That means that either we don't have a whole socks request at all, or
1737    * it's gotten split up.  We're going to try passing parse_socks() bigger
1738    * and bigger chunks until either it says "Okay, I got it", or it says it
1739    * will need more data than we currently have. */
1740
1741   /* Loop while we have more data that we haven't given parse_socks() yet. */
1742   do {
1743     int free_data = 0;
1744     const size_t last_wanted = want_length;
1745     n_drain = 0;
1746     data = NULL;
1747     datalen = inspect_evbuffer(buf, &data, want_length, &free_data, NULL);
1748
1749     want_length = 0;
1750     res = parse_socks(data, datalen, req, log_sockstype,
1751                       safe_socks, &n_drain, &want_length);
1752
1753     if (free_data)
1754       tor_free(data);
1755
1756     if (n_drain < 0)
1757       evbuffer_drain(buf, evbuffer_get_length(buf));
1758     else if (n_drain > 0)
1759       evbuffer_drain(buf, n_drain);
1760
1761     if (res == 0 && n_drain == 0 && want_length <= last_wanted) {
1762       /* If we drained nothing, and we didn't ask for more than last time,
1763        * then we probably wanted more data than the buffer actually had,
1764        * and we're finding out that we're not satisified with it. It's
1765        * time to break until we have more data. */
1766       break;
1767     }
1768
1769     buflen = evbuffer_get_length(buf);
1770   } while (res == 0 && want_length <= buflen && buflen >= 2);
1771
1772   return res;
1773 }
1774 #endif
1775
1776 /** The size of the header of an Extended ORPort message: 2 bytes for
1777  *  COMMAND, 2 bytes for BODYLEN */
1778 #define EXT_OR_CMD_HEADER_SIZE 4
1779
1780 /** Read <b>buf</b>, which should contain an Extended ORPort message
1781  *  from a transport proxy. If well-formed, create and populate
1782  *  <b>out</b> with the Extended ORport message. Return 0 if the
1783  *  buffer was incomplete, 1 if it was well-formed and -1 if we
1784  *  encountered an error while parsing it.  */
1785 int
1786 fetch_ext_or_command_from_buf(buf_t *buf, ext_or_cmd_t **out)
1787 {
1788   char hdr[EXT_OR_CMD_HEADER_SIZE];
1789   uint16_t len;
1790
1791   check();
1792   if (buf->datalen < EXT_OR_CMD_HEADER_SIZE)
1793     return 0;
1794   peek_from_buf(hdr, sizeof(hdr), buf);
1795   len = ntohs(get_uint16(hdr+2));
1796   if (buf->datalen < (unsigned)len + EXT_OR_CMD_HEADER_SIZE)
1797     return 0;
1798   *out = ext_or_cmd_new(len);
1799   (*out)->cmd = ntohs(get_uint16(hdr));
1800   (*out)->len = len;
1801   buf_remove_from_front(buf, EXT_OR_CMD_HEADER_SIZE);
1802   fetch_from_buf((*out)->body, len, buf);
1803   return 1;
1804 }
1805
#ifdef USE_BUFFEREVENTS
/** As fetch_ext_or_command_from_buf(), but read from the evbuffer
 * <b>buf</b>.  The message header holds a 16-bit command and a 16-bit body
 * length, both in network byte order.
 *
 * Return 1 after storing a newly created command in *<b>out</b> and
 * removing the message from <b>buf</b>; return 0, changing nothing, if the
 * header or body has not completely arrived.  (No code path here returns
 * -1.) */
int
fetch_ext_or_command_from_evbuffer(struct evbuffer *buf, ext_or_cmd_t **out)
{
  char header[EXT_OR_CMD_HEADER_SIZE];
  uint16_t body_len;
  ext_or_cmd_t *msg;
  const size_t available = evbuffer_get_length(buf);

  if (available < EXT_OR_CMD_HEADER_SIZE)
    return 0;

  /* Copy the header out without consuming it. */
  evbuffer_copyout(buf, header, EXT_OR_CMD_HEADER_SIZE);
  body_len = ntohs(get_uint16(header+2));
  if (available < (unsigned)body_len + EXT_OR_CMD_HEADER_SIZE)
    return 0;

  msg = ext_or_cmd_new(body_len);
  msg->cmd = ntohs(get_uint16(header));
  msg->len = body_len;

  /* Discard the header, then pull the body into the command object. */
  evbuffer_drain(buf, EXT_OR_CMD_HEADER_SIZE);
  evbuffer_remove(buf, msg->body, body_len);

  *out = msg;
  return 1;
}
#endif
1833
1834 /** Implementation helper to implement fetch_from_*_socks.  Instead of looking
1835  * at a buffer's contents, we look at the <b>datalen</b> bytes of data in
1836  * <b>data</b>. Instead of removing data from the buffer, we set
1837  * <b>drain_out</b> to the amount of data that should be removed (or -1 if the
1838  * buffer should be cleared).  Instead of pulling more data into the first
1839  * chunk of the buffer, we set *<b>want_length_out</b> to the number of bytes
1840  * we'd like to see in the input buffer, if they're available. */
1841 static int
1842 parse_socks(const char *data, size_t datalen, socks_request_t *req,
1843             int log_sockstype, int safe_socks, ssize_t *drain_out,
1844             size_t *want_length_out)
1845 {
1846   unsigned int len;
1847   char tmpbuf[TOR_ADDR_BUF_LEN+1];
1848   tor_addr_t destaddr;
1849   uint32_t destip;
1850   uint8_t socksver;
1851   char *next, *startaddr;
1852   unsigned char usernamelen, passlen;
1853   struct in_addr in;
1854
1855   if (datalen < 2) {
1856     /* We always need at least 2 bytes. */
1857     *want_length_out = 2;
1858     return 0;
1859   }
1860
1861   if (req->socks_version == 5 && !req->got_auth) {
1862     /* See if we have received authentication.  Strictly speaking, we should
1863        also check whether we actually negotiated username/password
1864        authentication.  But some broken clients will send us authentication
1865        even if we negotiated SOCKS_NO_AUTH. */
1866     if (*data == 1) { /* username/pass version 1 */
1867       /* Format is: authversion [1 byte] == 1
1868                     usernamelen [1 byte]
1869                     username    [usernamelen bytes]
1870                     passlen     [1 byte]
1871                     password    [passlen bytes] */
1872       usernamelen = (unsigned char)*(data + 1);
1873       if (datalen < 2u + usernamelen + 1u) {
1874         *want_length_out = 2u + usernamelen + 1u;
1875         return 0;
1876       }
1877       passlen = (unsigned char)*(data + 2u + usernamelen);
1878       if (datalen < 2u + usernamelen + 1u + passlen) {
1879         *want_length_out = 2u + usernamelen + 1u + passlen;
1880         return 0;
1881       }
1882       req->replylen = 2; /* 2 bytes of response */
1883       req->reply[0] = 1; /* authversion == 1 */
1884       req->reply[1] = 0; /* authentication successful */
1885       log_debug(LD_APP,
1886                "socks5: Accepted username/password without checking.");
1887       if (usernamelen) {
1888         req->username = tor_memdup(data+2u, usernamelen);
1889         req->usernamelen = usernamelen;
1890       }
1891       if (passlen) {
1892         req->password = tor_memdup(data+3u+usernamelen, passlen);
1893         req->passwordlen = passlen;
1894       }
1895       *drain_out = 2u + usernamelen + 1u + passlen;
1896       req->got_auth = 1;
1897       *want_length_out = 7; /* Minimal socks5 sommand. */
1898       return 0;
1899     } else if (req->auth_type == SOCKS_USER_PASS) {
1900       /* unknown version byte */
1901       log_warn(LD_APP, "Socks5 username/password version %d not recognized; "
1902                "rejecting.", (int)*data);
1903       return -1;
1904     }
1905   }
1906
1907   socksver = *data;
1908
1909   switch (socksver) { /* which version of socks? */
1910     case 5: /* socks5 */
1911
1912       if (req->socks_version != 5) { /* we need to negotiate a method */
1913         unsigned char nummethods = (unsigned char)*(data+1);
1914         int have_user_pass, have_no_auth;
1915         int r=0;
1916         tor_assert(!req->socks_version);
1917         if (datalen < 2u+nummethods) {
1918           *want_length_out = 2u+nummethods;
1919           return 0;
1920         }
1921         if (!nummethods)
1922           return -1;
1923         req->replylen = 2; /* 2 bytes of response */
1924         req->reply[0] = 5; /* socks5 reply */
1925         have_user_pass = (memchr(data+2, SOCKS_USER_PASS, nummethods) !=NULL);
1926         have_no_auth   = (memchr(data+2, SOCKS_NO_AUTH,   nummethods) !=NULL);
1927         if (have_user_pass && !(have_no_auth && req->socks_prefer_no_auth)) {
1928           req->auth_type = SOCKS_USER_PASS;
1929           req->reply[1] = SOCKS_USER_PASS; /* tell client to use "user/pass"
1930                                               auth method */
1931           req->socks_version = 5; /* remember we've already negotiated auth */
1932           log_debug(LD_APP,"socks5: accepted method 2 (username/password)");
1933           r=0;
1934         } else if (have_no_auth) {
1935           req->reply[1] = SOCKS_NO_AUTH; /* tell client to use "none" auth
1936                                             method */
1937           req->socks_version = 5; /* remember we've already negotiated auth */
1938           log_debug(LD_APP,"socks5: accepted method 0 (no authentication)");
1939           r=0;
1940         } else {
1941           log_warn(LD_APP,
1942                     "socks5: offered methods don't include 'no auth' or "
1943                     "username/password. Rejecting.");
1944           req->reply[1] = '\xFF'; /* reject all methods */
1945           r=-1;
1946         }
1947         /* Remove packet from buf. Some SOCKS clients will have sent extra
1948          * junk at this point; let's hope it's an authentication message. */
1949         *drain_out = 2u + nummethods;
1950
1951         return r;
1952       }
1953       if (req->auth_type != SOCKS_NO_AUTH && !req->got_auth) {
1954         log_warn(LD_APP,
1955                  "socks5: negotiated authentication, but none provided");
1956         return -1;
1957       }
1958       /* we know the method; read in the request */
1959       log_debug(LD_APP,"socks5: checking request");
1960       if (datalen < 7) {/* basic info plus >=1 for addr plus 2 for port */
1961         *want_length_out = 7;
1962         return 0; /* not yet */
1963       }
1964       req->command = (unsigned char) *(data+1);
1965       if (req->command != SOCKS_COMMAND_CONNECT &&
1966           req->command != SOCKS_COMMAND_RESOLVE &&
1967           req->command != SOCKS_COMMAND_RESOLVE_PTR) {
1968         /* not a connect or resolve or a resolve_ptr? we don't support it. */
1969         log_warn(LD_APP,"socks5: command %d not recognized. Rejecting.",
1970                  req->command);
1971         return -1;
1972       }
1973       switch (*(data+3)) { /* address type */
1974         case 1: /* IPv4 address */
1975         case 4: /* IPv6 address */ {
1976           const int is_v6 = *(data+3) == 4;
1977           const unsigned addrlen = is_v6 ? 16 : 4;
1978           log_debug(LD_APP,"socks5: ipv4 address type");
1979           if (datalen < 6+addrlen) {/* ip/port there? */
1980             *want_length_out = 6+addrlen;
1981             return 0; /* not yet */
1982           }
1983
1984           if (is_v6)
1985             tor_addr_from_ipv6_bytes(&destaddr, data+4);
1986           else
1987             tor_addr_from_ipv4n(&destaddr, get_uint32(data+4));
1988
1989           tor_addr_to_str(tmpbuf, &destaddr, sizeof(tmpbuf), 1);
1990
1991           if (strlen(tmpbuf)+1 > MAX_SOCKS_ADDR_LEN) {
1992             log_warn(LD_APP,
1993                      "socks5 IP takes %d bytes, which doesn't fit in %d. "
1994                      "Rejecting.",
1995                      (int)strlen(tmpbuf)+1,(int)MAX_SOCKS_ADDR_LEN);
1996             return -1;
1997           }
1998           strlcpy(req->address,tmpbuf,sizeof(req->address));
1999           req->port = ntohs(get_uint16(data+4+addrlen));
2000           *drain_out = 6+addrlen;
2001           if (req->command != SOCKS_COMMAND_RESOLVE_PTR &&
2002               !addressmap_have_mapping(req->address,0)) {
2003             log_unsafe_socks_warning(5, req->address, req->port, safe_socks);
2004             if (safe_socks)
2005               return -1;
2006           }
2007           return 1;
2008         }
2009         case 3: /* fqdn */
2010           log_debug(LD_APP,"socks5: fqdn address type");
2011           if (req->command == SOCKS_COMMAND_RESOLVE_PTR) {
2012             log_warn(LD_APP, "socks5 received RESOLVE_PTR command with "
2013                      "hostname type. Rejecting.");
2014             return -1;
2015           }
2016           len = (unsigned char)*(data+4);
2017           if (datalen < 7+len) { /* addr/port there? */
2018             *want_length_out = 7+len;
2019             return 0; /* not yet */
2020           }
2021           if (len+1 > MAX_SOCKS_ADDR_LEN) {
2022             log_warn(LD_APP,
2023                      "socks5 hostname is %d bytes, which doesn't fit in "
2024                      "%d. Rejecting.", len+1,MAX_SOCKS_ADDR_LEN);
2025             return -1;
2026           }
2027           memcpy(req->address,data+5,len);
2028           req->address[len] = 0;
2029           req->port = ntohs(get_uint16(data+5+len));
2030           *drain_out = 5+len+2;
2031           if (!tor_strisprint(req->address) || strchr(req->address,'\"')) {
2032             log_warn(LD_PROTOCOL,
2033                      "Your application (using socks5 to port %d) gave Tor "
2034                      "a malformed hostname: %s. Rejecting the connection.",
2035                      req->port, escaped(req->address));
2036             return -1;
2037           }
2038           if (log_sockstype)
2039             log_notice(LD_APP,
2040                   "Your application (using socks5 to port %d) instructed "
2041                   "Tor to take care of the DNS resolution itself if "
2042                   "necessary. This is good.", req->port);
2043           return 1;
2044         default: /* unsupported */
2045           log_warn(LD_APP,"socks5: unsupported address type %d. Rejecting.",
2046                    (int) *(data+3));
2047           return -1;
2048       }
2049       tor_assert(0);
2050     case 4: { /* socks4 */
2051       enum {socks4, socks4a} socks4_prot = socks4a;
2052       const char *authstart, *authend;
2053       /* http://ss5.sourceforge.net/socks4.protocol.txt */
2054       /* http://ss5.sourceforge.net/socks4A.protocol.txt */
2055
2056       req->socks_version = 4;
2057       if (datalen < SOCKS4_NETWORK_LEN) {/* basic info available? */
2058         *want_length_out = SOCKS4_NETWORK_LEN;
2059         return 0; /* not yet */
2060       }
2061       // buf_pullup(buf, 1280, 0);
2062       req->command = (unsigned char) *(data+1);
2063       if (req->command != SOCKS_COMMAND_CONNECT &&
2064           req->command != SOCKS_COMMAND_RESOLVE) {
2065         /* not a connect or resolve? we don't support it. (No resolve_ptr with
2066          * socks4.) */
2067         log_warn(LD_APP,"socks4: command %d not recognized. Rejecting.",
2068                  req->command);
2069         return -1;
2070       }
2071
2072       req->port = ntohs(get_uint16(data+2));
2073       destip = ntohl(get_uint32(data+4));
2074       if ((!req->port && req->command!=SOCKS_COMMAND_RESOLVE) || !destip) {
2075         log_warn(LD_APP,"socks4: Port or DestIP is zero. Rejecting.");
2076         return -1;
2077       }
2078       if (destip >> 8) {
2079         log_debug(LD_APP,"socks4: destip not in form 0.0.0.x.");
2080         in.s_addr = htonl(destip);
2081         tor_inet_ntoa(&in,tmpbuf,sizeof(tmpbuf));
2082         if (strlen(tmpbuf)+1 > MAX_SOCKS_ADDR_LEN) {
2083           log_debug(LD_APP,"socks4 addr (%d bytes) too long. Rejecting.",
2084                     (int)strlen(tmpbuf));
2085           return -1;
2086         }
2087         log_debug(LD_APP,
2088                   "socks4: successfully read destip (%s)",
2089                   safe_str_client(tmpbuf));
2090         socks4_prot = socks4;
2091       }
2092
2093       authstart = data + SOCKS4_NETWORK_LEN;
2094       next = memchr(authstart, 0,
2095                     datalen-SOCKS4_NETWORK_LEN);
2096       if (!next) {
2097         if (datalen >= 1024) {
2098           log_debug(LD_APP, "Socks4 user name too long; rejecting.");
2099           return -1;
2100         }
2101         log_debug(LD_APP,"socks4: Username not here yet.");
2102         *want_length_out = datalen+1024; /* More than we need, but safe */
2103         return 0;
2104       }
2105       authend = next;
2106       tor_assert(next < data+datalen);
2107
2108       startaddr = NULL;
2109       if (socks4_prot != socks4a &&
2110           !addressmap_have_mapping(tmpbuf,0)) {
2111         log_unsafe_socks_warning(4, tmpbuf, req->port, safe_socks);
2112
2113         if (safe_socks)
2114           return -1;
2115       }
2116       if (socks4_prot == socks4a) {
2117         if (next+1 == data+datalen) {
2118           log_debug(LD_APP,"socks4: No part of destaddr here yet.");
2119           *want_length_out = datalen + 1024; /* More than we need, but safe */
2120           return 0;
2121         }
2122         startaddr = next+1;
2123         next = memchr(startaddr, 0, data + datalen - startaddr);
2124         if (!next) {
2125           if (datalen >= 1024) {
2126             log_debug(LD_APP,"socks4: Destaddr too long.");
2127             return -1;
2128           }
2129           log_debug(LD_APP,"socks4: Destaddr not all here yet.");
2130           *want_length_out = datalen + 1024; /* More than we need, but safe */
2131           return 0;
2132         }
2133         if (MAX_SOCKS_ADDR_LEN <= next-startaddr) {
2134           log_warn(LD_APP,"socks4: Destaddr too long. Rejecting.");
2135           return -1;
2136         }
2137         // tor_assert(next < buf->cur+buf->datalen);
2138
2139         if (log_sockstype)
2140           log_notice(LD_APP,
2141                      "Your application (using socks4a to port %d) instructed "
2142                      "Tor to take care of the DNS resolution itself if "
2143                      "necessary. This is good.", req->port);
2144       }
2145       log_debug(LD_APP,"socks4: Everything is here. Success.");
2146       strlcpy(req->address, startaddr ? startaddr : tmpbuf,
2147               sizeof(req->address));
2148       if (!tor_strisprint(req->address) || strchr(req->address,'\"')) {
2149         log_warn(LD_PROTOCOL,
2150                  "Your application (using socks4 to port %d) gave Tor "
2151                  "a malformed hostname: %s. Rejecting the connection.",
2152                  req->port, escaped(req->address));
2153         return -1;
2154       }
2155       if (authend != authstart) {
2156         req->got_auth = 1;
2157         req->usernamelen = authend - authstart;
2158         req->username = tor_memdup(authstart, authend - authstart);
2159       }
2160       /* next points to the final \0 on inbuf */
2161       *drain_out = next - data + 1;
2162       return 1;
2163     }
2164     case 'G': /* get */
2165     case 'H': /* head */
2166     case 'P': /* put/post */
2167     case 'C': /* connect */
2168       strlcpy((char*)req->reply,
2169 "HTTP/1.0 501 Tor is not an HTTP Proxy\r\n"
2170 "Content-Type: text/html; charset=iso-8859-1\r\n\r\n"
2171 "<html>\n"
2172 "<head>\n"
2173 "<title>Tor is not an HTTP Proxy</title>\n"
2174 "</head>\n"
2175 "<body>\n"
2176 "<h1>Tor is not an HTTP Proxy</h1>\n"
2177 "<p>\n"
2178 "It appears you have configured your web browser to use Tor as an HTTP proxy."
2179 "\n"
2180 "This is not correct: Tor is a SOCKS proxy, not an HTTP proxy.\n"
2181 "Please configure your client accordingly.\n"
2182 "</p>\n"
2183 "<p>\n"
2184 "See <a href=\"https://www.torproject.org/documentation.html\">"
2185            "https://www.torproject.org/documentation.html</a> for more "
2186            "information.\n"
2187 "<!-- Plus this comment, to make the body response more than 512 bytes, so "
2188 "     IE will be willing to display it. Comment comment comment comment "
2189 "     comment comment comment comment comment comment comment comment.-->\n"
2190 "</p>\n"
2191 "</body>\n"
2192 "</html>\n"
2193              , MAX_SOCKS_REPLY_LEN);
2194       req->replylen = strlen((char*)req->reply)+1;
2195       /* fall through */
2196     default: /* version is not socks4 or socks5 */
2197       log_warn(LD_APP,
2198                "Socks version %d not recognized. (Tor is not an http proxy.)",
2199                *(data));
2200       {
2201         /* Tell the controller the first 8 bytes. */
2202         char *tmp = tor_strndup(data, datalen < 8 ? datalen : 8);
2203         control_event_client_status(LOG_WARN,
2204                                     "SOCKS_UNKNOWN_PROTOCOL DATA=\"%s\"",
2205                                     escaped(tmp));
2206         tor_free(tmp);
2207       }
2208       return -1;
2209   }
2210 }
2211
2212 /** Inspect a reply from SOCKS server stored in <b>buf</b> according
2213  * to <b>state</b>, removing the protocol data upon success. Return 0 on
2214  * incomplete response, 1 on success and -1 on error, in which case
2215  * <b>reason</b> is set to a descriptive message (free() when finished
2216  * with it).
2217  *
2218  * As a special case, 2 is returned when user/pass is required
2219  * during SOCKS5 handshake and user/pass is configured.
2220  */
2221 int
2222 fetch_from_buf_socks_client(buf_t *buf, int state, char **reason)
2223 {
2224   ssize_t drain = 0;
2225   int r;
2226   if (buf->datalen < 2)
2227     return 0;
2228
2229   buf_pullup(buf, MAX_SOCKS_MESSAGE_LEN, 0);
2230   tor_assert(buf->head && buf->head->datalen >= 2);
2231
2232   r = parse_socks_client((uint8_t*)buf->head->data, buf->head->datalen,
2233                          state, reason, &drain);
2234   if (drain > 0)
2235     buf_remove_from_front(buf, drain);
2236   else if (drain < 0)
2237     buf_clear(buf);
2238
2239   return r;
2240 }
2241
#ifdef USE_BUFFEREVENTS
/** As fetch_from_buf_socks_client(), but works on an evbuffer: parse the
 * SOCKS server reply waiting on <b>buf</b> according to <b>state</b>, drain
 * what the parser consumed, and return the parser's result. */
int
fetch_from_evbuffer_socks_client(struct evbuffer *buf, int state,
                                 char **reason)
{
  ssize_t n_to_drain = 0;
  size_t n_linear;
  uint8_t *bytes;
  int result;

  /* Linearize at most MAX_SOCKS_MESSAGE_LEN bytes of the reply; the parser
   * is only shown that much. */
  n_linear = evbuffer_get_length(buf);
  if (n_linear > MAX_SOCKS_MESSAGE_LEN)
    n_linear = MAX_SOCKS_MESSAGE_LEN;
  bytes = evbuffer_pullup(buf, n_linear);

  result = parse_socks_client(bytes, n_linear, state, reason, &n_to_drain);

  /* Negative means "empty the whole buffer"; positive is an exact count. */
  if (n_to_drain < 0)
    evbuffer_drain(buf, evbuffer_get_length(buf));
  else if (n_to_drain > 0)
    evbuffer_drain(buf, n_to_drain);

  return result;
}
#endif
2269
2270 /** Implementation logic for fetch_from_*_socks_client. */
2271 static int
2272 parse_socks_client(const uint8_t *data, size_t datalen,
2273                    int state, char **reason,
2274                    ssize_t *drain_out)
2275 {
2276   unsigned int addrlen;
2277   *drain_out = 0;
2278   if (datalen < 2)
2279     return 0;
2280
2281   switch (state) {
2282     case PROXY_SOCKS4_WANT_CONNECT_OK:
2283       /* Wait for the complete response */
2284       if (datalen < 8)
2285         return 0;
2286
2287       if (data[1] != 0x5a) {
2288         *reason = tor_strdup(socks4_response_code_to_string(data[1]));
2289         return -1;
2290       }
2291
2292       /* Success */
2293       *drain_out = 8;
2294       return 1;
2295
2296     case PROXY_SOCKS5_WANT_AUTH_METHOD_NONE:
2297       /* we don't have any credentials */
2298       if (data[1] != 0x00) {
2299         *reason = tor_strdup("server doesn't support any of our "
2300                              "available authentication methods");
2301         return -1;
2302       }
2303
2304       log_info(LD_NET, "SOCKS 5 client: continuing without authentication");
2305       *drain_out = -1;
2306       return 1;
2307
2308     case PROXY_SOCKS5_WANT_AUTH_METHOD_RFC1929:
2309       /* we have a username and password. return 1 if we can proceed without
2310        * providing authentication, or 2 otherwise. */
2311       switch (data[1]) {
2312         case 0x00:
2313           log_info(LD_NET, "SOCKS 5 client: we have auth details but server "
2314                             "doesn't require authentication.");
2315           *drain_out = -1;
2316           return 1;
2317         case 0x02:
2318           log_info(LD_NET, "SOCKS 5 client: need authentication.");
2319           *drain_out = -1;
2320           return 2;
2321         /* fall through */
2322       }
2323
2324       *reason = tor_strdup("server doesn't support any of our available "
2325                            "authentication methods");
2326       return -1;
2327
2328     case PROXY_SOCKS5_WANT_AUTH_RFC1929_OK:
2329       /* handle server reply to rfc1929 authentication */
2330       if (data[1] != 0x00) {
2331         *reason = tor_strdup("authentication failed");
2332         return -1;
2333       }
2334
2335       log_info(LD_NET, "SOCKS 5 client: authentication successful.");
2336       *drain_out = -1;
2337       return 1;
2338
2339     case PROXY_SOCKS5_WANT_CONNECT_OK:
2340       /* response is variable length. BND.ADDR, etc, isn't needed
2341        * (don't bother with buf_pullup()), but make sure to eat all
2342        * the data used */
2343
2344       /* wait for address type field to arrive */
2345       if (datalen < 4)
2346         return 0;
2347
2348       switch (data[3]) {
2349         case 0x01: /* ip4 */
2350           addrlen = 4;
2351           break;
2352         case 0x04: /* ip6 */
2353           addrlen = 16;
2354           break;
2355         case 0x03: /* fqdn (can this happen here?) */
2356           if (datalen < 5)
2357             return 0;
2358           addrlen = 1 + data[4];
2359           break;
2360         default:
2361           *reason = tor_strdup("invalid response to connect request");
2362           return -1;
2363       }
2364
2365       /* wait for address and port */
2366       if (datalen < 6 + addrlen)
2367         return 0;
2368
2369       if (data[1] != 0x00) {
2370         *reason = tor_strdup(socks5_response_code_to_string(data[1]));
2371         return -1;
2372       }
2373
2374       *drain_out = 6 + addrlen;
2375       return 1;
2376   }
2377
2378   /* shouldn't get here... */
2379   tor_assert(0);
2380
2381   return -1;
2382 }
2383
2384 /** Return 1 iff buf looks more like it has an (obsolete) v0 controller
2385  * command on it than any valid v1 controller command. */
2386 int
2387 peek_buf_has_control0_command(buf_t *buf)
2388 {
2389   if (buf->datalen >= 4) {
2390     char header[4];
2391     uint16_t cmd;
2392     peek_from_buf(header, sizeof(header), buf);
2393     cmd = ntohs(get_uint16(header+2));
2394     if (cmd <= 0x14)
2395       return 1; /* This is definitely not a v1 control command. */
2396   }
2397   return 0;
2398 }
2399
#ifdef USE_BUFFEREVENTS
/** As peek_buf_has_control0_command(), but inspect the evbuffer
 * <b>buf</b>: return 1 iff at least 4 bytes are buffered and bytes 2-3,
 * read as a big-endian 16-bit value, are at most 0x14. */
int
peek_evbuffer_has_control0_command(struct evbuffer *buf)
{
  int free_out = 0;
  char *data = NULL;
  size_t n;
  uint16_t cmd;
  int looks_like_v0;

  if (evbuffer_get_length(buf) < 4)
    return 0;

  n = inspect_evbuffer(buf, &data, 4, &free_out, NULL);
  tor_assert(n >= 4);
  cmd = ntohs(get_uint16(data+2));
  looks_like_v0 = (cmd <= 0x14) ? 1 : 0;

  /* inspect_evbuffer() reports through free_out whether we must free. */
  if (free_out)
    tor_free(data);

  return looks_like_v0;
}
#endif
2420
2421 /** Return the index within <b>buf</b> at which <b>ch</b> first appears,
2422  * or -1 if <b>ch</b> does not appear on buf. */
2423 static off_t
2424 buf_find_offset_of_char(buf_t *buf, char ch)
2425 {
2426   chunk_t *chunk;
2427   off_t offset = 0;
2428   for (chunk = buf->head; chunk; chunk = chunk->next) {
2429     char *cp = memchr(chunk->data, ch, chunk->datalen);
2430     if (cp)
2431       return offset + (cp - chunk->data);
2432     else
2433       offset += chunk->datalen;
2434   }
2435   return -1;
2436 }
2437
2438 /** Try to read a single LF-terminated line from <b>buf</b>, and write it
2439  * (including the LF), NUL-terminated, into the *<b>data_len</b> byte buffer
2440  * at <b>data_out</b>.  Set *<b>data_len</b> to the number of bytes in the
2441  * line, not counting the terminating NUL.  Return 1 if we read a whole line,
2442  * return 0 if we don't have a whole line yet, and return -1 if the line
2443  * length exceeds *<b>data_len</b>.
2444  */
2445 int
2446 fetch_from_buf_line(buf_t *buf, char *data_out, size_t *data_len)
2447 {
2448   size_t sz;
2449   off_t offset;
2450
2451   if (!buf->head)
2452     return 0;
2453
2454   offset = buf_find_offset_of_char(buf, '\n');
2455   if (offset < 0)
2456     return 0;
2457   sz = (size_t) offset;
2458   if (sz+2 > *data_len) {
2459     *data_len = sz + 2;
2460     return -1;
2461   }
2462   fetch_from_buf(data_out, sz+1, buf);
2463   data_out[sz+1] = '\0';
2464   *data_len = sz+1;
2465   return 1;
2466 }
2467
2468 /** Compress on uncompress the <b>data_len</b> bytes in <b>data</b> using the
2469  * zlib state <b>state</b>, appending the result to <b>buf</b>.  If
2470  * <b>done</b> is true, flush the data in the state and finish the
2471  * compression/uncompression.  Return -1 on failure, 0 on success. */
2472 int
2473 write_to_buf_zlib(buf_t *buf, tor_zlib_state_t *state,
2474                   const char *data, size_t data_len,
2475                   int done)
2476 {
2477   char *next;
2478   size_t old_avail, avail;
2479   int over = 0;
2480
2481   do {
2482     int need_new_chunk = 0;
2483     if (!buf->tail || ! CHUNK_REMAINING_CAPACITY(buf->tail)) {
2484       size_t cap = data_len / 4;
2485       buf_add_chunk_with_capacity(buf, cap, 1);
2486     }
2487     next = CHUNK_WRITE_PTR(buf->tail);
2488     avail = old_avail = CHUNK_REMAINING_CAPACITY(buf->tail);
2489     switch (tor_zlib_process(state, &next, &avail, &data, &data_len, done)) {
2490       case TOR_ZLIB_DONE:
2491         over = 1;
2492         break;
2493       case TOR_ZLIB_ERR:
2494         return -1;
2495       case TOR_ZLIB_OK:
2496         if (data_len == 0)
2497           over = 1;
2498         break;
2499       case TOR_ZLIB_BUF_FULL:
2500         if (avail) {
2501           /* Zlib says we need more room (ZLIB_BUF_FULL).  Start a new chunk
2502            * automatically, whether were going to or not. */
2503           need_new_chunk = 1;
2504         }
2505         break;
2506     }
2507     buf->datalen += old_avail - avail;
2508     buf->tail->datalen += old_avail - avail;
2509     if (need_new_chunk) {
2510       buf_add_chunk_with_capacity(buf, data_len/4, 1);
2511     }
2512
2513   } while (!over);
2514   check();
2515   return 0;
2516 }
2517
#ifdef USE_BUFFEREVENTS
/** As write_to_buf_zlib(), but append to the evbuffer <b>buf</b>: compress
 * or uncompress the <b>data_len</b> bytes in <b>data</b> using the zlib
 * state <b>state</b>, committing the output to <b>buf</b>.  If <b>done</b>
 * is true, flush the data in the state and finish the stream.  Return -1 on
 * failure, 0 on success.
 *
 * Unlike the buf_t version, this function must not invoke check(): that
 * macro expands to assert_buf_ok(buf), which expects a buf_t, not an
 * evbuffer. */
int
write_to_evbuffer_zlib(struct evbuffer *buf, tor_zlib_state_t *state,
                       const char *data, size_t data_len,
                       int done)
{
  char *next;
  size_t old_avail, avail;
  int over = 0, n;
  struct evbuffer_iovec vec[1];
  do {
    {
      /* Reserve output space in proportion to the remaining input, but
       * never less than 128 bytes. */
      size_t cap = data_len / 4;
      if (cap < 128)
        cap = 128;
      /* XXXX NM this strategy is fragmentation-prone. We should really have
       * two iovecs, and write first into the one, and then into the
       * second if the first gets full. */
      n = evbuffer_reserve_space(buf, cap, vec, 1);
      tor_assert(n == 1);
    }

    next = vec[0].iov_base;
    avail = old_avail = vec[0].iov_len;

    switch (tor_zlib_process(state, &next, &avail, &data, &data_len, done)) {
      case TOR_ZLIB_DONE:
        over = 1;
        break;
      case TOR_ZLIB_ERR:
        return -1;
      case TOR_ZLIB_OK:
        if (data_len == 0)
          over = 1;
        break;
      case TOR_ZLIB_BUF_FULL:
        /* Nothing special to do: the next pass through the loop reserves
         * fresh space anyway. */
        break;
    }

    /* XXXX possible infinite loop on BUF_FULL. */
    /* Commit only the bytes that zlib actually produced. */
    vec[0].iov_len = old_avail - avail;
    evbuffer_commit_space(buf, vec, 1);

  } while (!over);
  return 0;
}
#endif
2570
2571 /** Set *<b>output</b> to contain a copy of the data in *<b>input</b> */
2572 int
2573 generic_buffer_set_to_copy(generic_buffer_t **output,
2574                            const generic_buffer_t *input)
2575 {
2576 #ifdef USE_BUFFEREVENTS
2577   struct evbuffer_ptr ptr;
2578   size_t remaining = evbuffer_get_length(input);
2579   if (*output) {
2580     evbuffer_drain(*output, evbuffer_get_length(*output));
2581   } else {
2582     if (!(*output = evbuffer_new()))
2583       return -1;
2584   }
2585   evbuffer_ptr_set((struct evbuffer*)input, &ptr, 0, EVBUFFER_PTR_SET);
2586   while (remaining) {
2587     struct evbuffer_iovec v[4];
2588     int n_used, i;
2589     n_used = evbuffer_peek((struct evbuffer*)input, -1, &ptr, v, 4);
2590     if (n_used < 0)
2591       return -1;
2592     for (i=0;i<n_used;++i) {
2593       evbuffer_add(*output, v[i].iov_base, v[i].iov_len);
2594       tor_assert(v[i].iov_len <= remaining);
2595       remaining -= v[i].iov_len;
2596       evbuffer_ptr_set((struct evbuffer*)input,
2597                        &ptr, v[i].iov_len, EVBUFFER_PTR_ADD);
2598     }
2599   }
2600 #else
2601   if (*output)
2602     buf_free(*output);
2603   *output = buf_copy(input);
2604 #endif
2605   return 0;
2606 }
2607
2608 /** Log an error and exit if <b>buf</b> is corrupted.
2609  */
2610 void
2611 assert_buf_ok(buf_t *buf)
2612 {
2613   tor_assert(buf);
2614   tor_assert(buf->magic == BUFFER_MAGIC);
2615
2616   if (! buf->head) {
2617     tor_assert(!buf->tail);
2618     tor_assert(buf->datalen == 0);
2619   } else {
2620     chunk_t *ch;
2621     size_t total = 0;
2622     tor_assert(buf->tail);
2623     for (ch = buf->head; ch; ch = ch->next) {
2624       total += ch->datalen;
2625       tor_assert(ch->datalen <= ch->memlen);
2626       tor_assert(ch->data >= &ch->mem[0]);
2627       tor_assert(ch->data < &ch->mem[0]+ch->memlen);
2628       tor_assert(ch->data+ch->datalen <= &ch->mem[0] + ch->memlen);
2629       if (!ch->next)
2630         tor_assert(ch == buf->tail);
2631     }
2632     tor_assert(buf->datalen == total);
2633   }
2634 }
2635
#ifdef ENABLE_BUF_FREELISTS
/** Check the internal consistency of the chunk freelist <b>fl</b> with
 * tor_assert(): every chunk on it must have the list's allocation size,
 * and the number of chunks must equal the recorded current length and lie
 * between the recorded lowest and maximum lengths.
 */
static void
assert_freelist_ok(chunk_freelist_t *fl)
{
  int n = 0;
  chunk_t *ch;

  tor_assert(fl->alloc_size > 0);

  /* Count the chunks, checking each one's size along the way. */
  ch = fl->head;
  while (ch) {
    tor_assert(CHUNK_ALLOC_SIZE(ch->memlen) == fl->alloc_size);
    ++n;
    ch = ch->next;
  }

  tor_assert(n == fl->cur_length);
  tor_assert(n >= fl->lowest_length);
  tor_assert(n <= fl->max_length);
}
#endif
2655