Merge remote branch 'origin/maint-0.2.1'
[tor.git] / src / or / main.c
blobf33dc2f6b4f0c4a6dfd3c0d81051ecdec0228314
1 /* Copyright (c) 2001 Matej Pfajfar.
2 * Copyright (c) 2001-2004, Roger Dingledine.
3 * Copyright (c) 2004-2006, Roger Dingledine, Nick Mathewson.
4 * Copyright (c) 2007-2010, The Tor Project, Inc. */
5 /* See LICENSE for licensing information */
7 /**
8 * \file main.c
9 * \brief Toplevel module. Handles signals, multiplexes between
10 * connections, implements main loop, and drives scheduled events.
11 **/
13 #define MAIN_PRIVATE
14 #include "or.h"
15 #include "buffers.h"
16 #include "circuitbuild.h"
17 #include "circuitlist.h"
18 #include "circuituse.h"
19 #include "command.h"
20 #include "config.h"
21 #include "connection.h"
22 #include "connection_edge.h"
23 #include "connection_or.h"
24 #include "control.h"
25 #include "cpuworker.h"
26 #include "directory.h"
27 #include "dirserv.h"
28 #include "dirvote.h"
29 #include "dns.h"
30 #include "dnsserv.h"
31 #include "geoip.h"
32 #include "hibernate.h"
33 #include "main.h"
34 #include "microdesc.h"
35 #include "networkstatus.h"
36 #include "ntmain.h"
37 #include "onion.h"
38 #include "policies.h"
39 #include "relay.h"
40 #include "rendclient.h"
41 #include "rendcommon.h"
42 #include "rendservice.h"
43 #include "rephist.h"
44 #include "router.h"
45 #include "routerlist.h"
46 #include "routerparse.h"
47 #ifdef USE_DMALLOC
48 #include <dmalloc.h>
49 #include <openssl/crypto.h>
50 #endif
51 #include "memarea.h"
53 #ifdef HAVE_EVENT2_EVENT_H
54 #include <event2/event.h>
55 #else
56 #include <event.h>
57 #endif
59 void evdns_shutdown(int);
61 /********* PROTOTYPES **********/
63 static void dumpmemusage(int severity);
64 static void dumpstats(int severity); /* log stats */
65 static void conn_read_callback(int fd, short event, void *_conn);
66 static void conn_write_callback(int fd, short event, void *_conn);
67 static void signal_callback(int fd, short events, void *arg);
68 static void second_elapsed_callback(periodic_timer_t *timer, void *args);
69 static int conn_close_if_marked(int i);
70 static void connection_start_reading_from_linked_conn(connection_t *conn);
71 static int connection_should_read_from_linked_conn(connection_t *conn);
73 /********* START VARIABLES **********/
75 int global_read_bucket; /**< Max number of bytes I can read this second. */
76 int global_write_bucket; /**< Max number of bytes I can write this second. */
78 /** Max number of relayed (bandwidth class 1) bytes I can read this second. */
79 int global_relayed_read_bucket;
80 /** Max number of relayed (bandwidth class 1) bytes I can write this second. */
81 int global_relayed_write_bucket;
83 /** What was the read bucket before the last second_elapsed_callback() call?
84 * (used to determine how many bytes we've read). */
85 static int stats_prev_global_read_bucket;
86 /** What was the write bucket before the last second_elapsed_callback() call?
87 * (used to determine how many bytes we've written). */
88 static int stats_prev_global_write_bucket;
89 /* XXX we might want to keep stats about global_relayed_*_bucket too. Or not.*/
90 /** How many bytes have we read since we started the process? */
91 static uint64_t stats_n_bytes_read = 0;
92 /** How many bytes have we written since we started the process? */
93 static uint64_t stats_n_bytes_written = 0;
94 /** What time did this process start up? */
95 time_t time_of_process_start = 0;
96 /** How many seconds have we been running? */
97 long stats_n_seconds_working = 0;
98 /** When do we next launch DNS wildcarding checks? */
99 static time_t time_to_check_for_correct_dns = 0;
101 /** How often will we honor SIGNEWNYM requests? */
102 #define MAX_SIGNEWNYM_RATE 10
103 /** When did we last process a SIGNEWNYM request? */
104 static time_t time_of_last_signewnym = 0;
105 /** Is there a signewnym request we're currently waiting to handle? */
106 static int signewnym_is_pending = 0;
108 /** Smartlist of all open connections. */
109 static smartlist_t *connection_array = NULL;
110 /** List of connections that have been marked for close and need to be freed
111 * and removed from connection_array. */
112 static smartlist_t *closeable_connection_lst = NULL;
113 /** List of linked connections that are currently reading data into their
114 * inbuf from their partner's outbuf. */
115 static smartlist_t *active_linked_connection_lst = NULL;
116 /** Flag: Set to true iff we entered the current libevent main loop via
117 * <b>loop_once</b>. If so, there's no need to trigger a loopexit in order
118 * to handle linked connections. */
119 static int called_loop_once = 0;
121 /** We set this to 1 when we've opened a circuit, so we can print a log
122 * entry to inform the user that Tor is working. */
123 int has_completed_circuit=0;
125 /** How often do we check for router descriptors that we should download
126 * when we have too little directory info? */
127 #define GREEDY_DESCRIPTOR_RETRY_INTERVAL (10)
128 /** How often do we check for router descriptors that we should download
129 * when we have enough directory info? */
130 #define LAZY_DESCRIPTOR_RETRY_INTERVAL (60)
131 /** How often do we 'forgive' undownloadable router descriptors and attempt
132 * to download them again? */
133 #define DESCRIPTOR_FAILURE_RESET_INTERVAL (60*60)
134 /** How long do we let a directory connection stall before expiring it? */
135 #define DIR_CONN_MAX_STALL (5*60)
137 /** How long do we let OR connections handshake before we decide that
138 * they are obsolete? */
139 #define TLS_HANDSHAKE_TIMEOUT (60)
141 /********* END VARIABLES ************/
143 /****************************************************************************
145 * This section contains accessors and other methods on the connection_array
146 * variables (which are global within this file and unavailable outside it).
148 ****************************************************************************/
150 /** Add <b>conn</b> to the array of connections that we can poll on. The
151 * connection's socket must be set; the connection starts out
152 * non-reading and non-writing.
155 connection_add(connection_t *conn)
157 tor_assert(conn);
158 tor_assert(conn->s >= 0 ||
159 conn->linked ||
160 (conn->type == CONN_TYPE_AP &&
161 TO_EDGE_CONN(conn)->is_dns_request));
163 tor_assert(conn->conn_array_index == -1); /* can only connection_add once */
164 conn->conn_array_index = smartlist_len(connection_array);
165 smartlist_add(connection_array, conn);
167 if (conn->s >= 0 || conn->linked) {
168 conn->read_event = tor_event_new(tor_libevent_get_base(),
169 conn->s, EV_READ|EV_PERSIST, conn_read_callback, conn);
170 conn->write_event = tor_event_new(tor_libevent_get_base(),
171 conn->s, EV_WRITE|EV_PERSIST, conn_write_callback, conn);
174 log_debug(LD_NET,"new conn type %s, socket %d, address %s, n_conns %d.",
175 conn_type_to_string(conn->type), conn->s, conn->address,
176 smartlist_len(connection_array));
178 return 0;
181 /** Tell libevent that we don't care about <b>conn</b> any more. */
182 void
183 connection_unregister_events(connection_t *conn)
185 if (conn->read_event) {
186 if (event_del(conn->read_event))
187 log_warn(LD_BUG, "Error removing read event for %d", conn->s);
188 tor_free(conn->read_event);
190 if (conn->write_event) {
191 if (event_del(conn->write_event))
192 log_warn(LD_BUG, "Error removing write event for %d", conn->s);
193 tor_free(conn->write_event);
195 if (conn->dns_server_port) {
196 dnsserv_close_listener(conn);
200 /** Remove the connection from the global list, and remove the
201 * corresponding poll entry. Calling this function will shift the last
202 * connection (if any) into the position occupied by conn.
205 connection_remove(connection_t *conn)
207 int current_index;
208 connection_t *tmp;
210 tor_assert(conn);
212 log_debug(LD_NET,"removing socket %d (type %s), n_conns now %d",
213 conn->s, conn_type_to_string(conn->type),
214 smartlist_len(connection_array));
216 tor_assert(conn->conn_array_index >= 0);
217 current_index = conn->conn_array_index;
218 connection_unregister_events(conn); /* This is redundant, but cheap. */
219 if (current_index == smartlist_len(connection_array)-1) { /* at the end */
220 smartlist_del(connection_array, current_index);
221 return 0;
224 /* replace this one with the one at the end */
225 smartlist_del(connection_array, current_index);
226 tmp = smartlist_get(connection_array, current_index);
227 tmp->conn_array_index = current_index;
229 return 0;
232 /** If <b>conn</b> is an edge conn, remove it from the list
233 * of conn's on this circuit. If it's not on an edge,
234 * flush and send destroys for all circuits on this conn.
236 * Remove it from connection_array (if applicable) and
237 * from closeable_connection_list.
239 * Then free it.
241 static void
242 connection_unlink(connection_t *conn)
244 connection_about_to_close_connection(conn);
245 if (conn->conn_array_index >= 0) {
246 connection_remove(conn);
248 if (conn->linked_conn) {
249 conn->linked_conn->linked_conn = NULL;
250 if (! conn->linked_conn->marked_for_close &&
251 conn->linked_conn->reading_from_linked_conn)
252 connection_start_reading(conn->linked_conn);
253 conn->linked_conn = NULL;
255 smartlist_remove(closeable_connection_lst, conn);
256 smartlist_remove(active_linked_connection_lst, conn);
257 if (conn->type == CONN_TYPE_EXIT) {
258 assert_connection_edge_not_dns_pending(TO_EDGE_CONN(conn));
260 if (conn->type == CONN_TYPE_OR) {
261 if (!tor_digest_is_zero(TO_OR_CONN(conn)->identity_digest))
262 connection_or_remove_from_identity_map(TO_OR_CONN(conn));
264 connection_free(conn);
267 /** Schedule <b>conn</b> to be closed. **/
268 void
269 add_connection_to_closeable_list(connection_t *conn)
271 tor_assert(!smartlist_isin(closeable_connection_lst, conn));
272 tor_assert(conn->marked_for_close);
273 assert_connection_ok(conn, time(NULL));
274 smartlist_add(closeable_connection_lst, conn);
277 /** Return 1 if conn is on the closeable list, else return 0. */
279 connection_is_on_closeable_list(connection_t *conn)
281 return smartlist_isin(closeable_connection_lst, conn);
284 /** Return true iff conn is in the current poll array. */
286 connection_in_array(connection_t *conn)
288 return smartlist_isin(connection_array, conn);
291 /** Set <b>*array</b> to an array of all connections, and <b>*n</b>
292 * to the length of the array. <b>*array</b> and <b>*n</b> must not
293 * be modified.
295 smartlist_t *
296 get_connection_array(void)
298 if (!connection_array)
299 connection_array = smartlist_create();
300 return connection_array;
303 /** Set the event mask on <b>conn</b> to <b>events</b>. (The event
304 * mask is a bitmask whose bits are READ_EVENT and WRITE_EVENT)
306 void
307 connection_watch_events(connection_t *conn, watchable_events_t events)
309 if (events & READ_EVENT)
310 connection_start_reading(conn);
311 else
312 connection_stop_reading(conn);
314 if (events & WRITE_EVENT)
315 connection_start_writing(conn);
316 else
317 connection_stop_writing(conn);
320 /** Return true iff <b>conn</b> is listening for read events. */
322 connection_is_reading(connection_t *conn)
324 tor_assert(conn);
326 return conn->reading_from_linked_conn ||
327 (conn->read_event && event_pending(conn->read_event, EV_READ, NULL));
330 /** Tell the main loop to stop notifying <b>conn</b> of any read events. */
331 void
332 connection_stop_reading(connection_t *conn)
334 tor_assert(conn);
335 tor_assert(conn->read_event);
337 if (conn->linked) {
338 conn->reading_from_linked_conn = 0;
339 connection_stop_reading_from_linked_conn(conn);
340 } else {
341 if (event_del(conn->read_event))
342 log_warn(LD_NET, "Error from libevent setting read event state for %d "
343 "to unwatched: %s",
344 conn->s,
345 tor_socket_strerror(tor_socket_errno(conn->s)));
349 /** Tell the main loop to start notifying <b>conn</b> of any read events. */
350 void
351 connection_start_reading(connection_t *conn)
353 tor_assert(conn);
354 tor_assert(conn->read_event);
356 if (conn->linked) {
357 conn->reading_from_linked_conn = 1;
358 if (connection_should_read_from_linked_conn(conn))
359 connection_start_reading_from_linked_conn(conn);
360 } else {
361 if (event_add(conn->read_event, NULL))
362 log_warn(LD_NET, "Error from libevent setting read event state for %d "
363 "to watched: %s",
364 conn->s,
365 tor_socket_strerror(tor_socket_errno(conn->s)));
369 /** Return true iff <b>conn</b> is listening for write events. */
371 connection_is_writing(connection_t *conn)
373 tor_assert(conn);
375 return conn->writing_to_linked_conn ||
376 (conn->write_event && event_pending(conn->write_event, EV_WRITE, NULL));
379 /** Tell the main loop to stop notifying <b>conn</b> of any write events. */
380 void
381 connection_stop_writing(connection_t *conn)
383 tor_assert(conn);
384 tor_assert(conn->write_event);
386 if (conn->linked) {
387 conn->writing_to_linked_conn = 0;
388 if (conn->linked_conn)
389 connection_stop_reading_from_linked_conn(conn->linked_conn);
390 } else {
391 if (event_del(conn->write_event))
392 log_warn(LD_NET, "Error from libevent setting write event state for %d "
393 "to unwatched: %s",
394 conn->s,
395 tor_socket_strerror(tor_socket_errno(conn->s)));
399 /** Tell the main loop to start notifying <b>conn</b> of any write events. */
400 void
401 connection_start_writing(connection_t *conn)
403 tor_assert(conn);
404 tor_assert(conn->write_event);
406 if (conn->linked) {
407 conn->writing_to_linked_conn = 1;
408 if (conn->linked_conn &&
409 connection_should_read_from_linked_conn(conn->linked_conn))
410 connection_start_reading_from_linked_conn(conn->linked_conn);
411 } else {
412 if (event_add(conn->write_event, NULL))
413 log_warn(LD_NET, "Error from libevent setting write event state for %d "
414 "to watched: %s",
415 conn->s,
416 tor_socket_strerror(tor_socket_errno(conn->s)));
420 /** Return true iff <b>conn</b> is linked conn, and reading from the conn
421 * linked to it would be good and feasible. (Reading is "feasible" if the
422 * other conn exists and has data in its outbuf, and is "good" if we have our
423 * reading_from_linked_conn flag set and the other conn has its
424 * writing_to_linked_conn flag set.)*/
425 static int
426 connection_should_read_from_linked_conn(connection_t *conn)
428 if (conn->linked && conn->reading_from_linked_conn) {
429 if (! conn->linked_conn ||
430 (conn->linked_conn->writing_to_linked_conn &&
431 buf_datalen(conn->linked_conn->outbuf)))
432 return 1;
434 return 0;
437 /** Helper: Tell the main loop to begin reading bytes into <b>conn</b> from
438 * its linked connection, if it is not doing so already. Called by
439 * connection_start_reading and connection_start_writing as appropriate. */
440 static void
441 connection_start_reading_from_linked_conn(connection_t *conn)
443 tor_assert(conn);
444 tor_assert(conn->linked == 1);
446 if (!conn->active_on_link) {
447 conn->active_on_link = 1;
448 smartlist_add(active_linked_connection_lst, conn);
449 if (!called_loop_once) {
450 /* This is the first event on the list; we won't be in LOOP_ONCE mode,
451 * so we need to make sure that the event_base_loop() actually exits at
452 * the end of its run through the current connections and lets us
453 * activate read events for linked connections. */
454 struct timeval tv = { 0, 0 };
455 tor_event_base_loopexit(tor_libevent_get_base(), &tv);
457 } else {
458 tor_assert(smartlist_isin(active_linked_connection_lst, conn));
462 /** Tell the main loop to stop reading bytes into <b>conn</b> from its linked
463 * connection, if is currently doing so. Called by connection_stop_reading,
464 * connection_stop_writing, and connection_read. */
465 void
466 connection_stop_reading_from_linked_conn(connection_t *conn)
468 tor_assert(conn);
469 tor_assert(conn->linked == 1);
471 if (conn->active_on_link) {
472 conn->active_on_link = 0;
473 /* FFFF We could keep an index here so we can smartlist_del
474 * cleanly. On the other hand, this doesn't show up on profiles,
475 * so let's leave it alone for now. */
476 smartlist_remove(active_linked_connection_lst, conn);
477 } else {
478 tor_assert(!smartlist_isin(active_linked_connection_lst, conn));
482 /** Close all connections that have been scheduled to get closed. */
483 static void
484 close_closeable_connections(void)
486 int i;
487 for (i = 0; i < smartlist_len(closeable_connection_lst); ) {
488 connection_t *conn = smartlist_get(closeable_connection_lst, i);
489 if (conn->conn_array_index < 0) {
490 connection_unlink(conn); /* blow it away right now */
491 } else {
492 if (!conn_close_if_marked(conn->conn_array_index))
493 ++i;
498 /** Libevent callback: this gets invoked when (connection_t*)<b>conn</b> has
499 * some data to read. */
500 static void
501 conn_read_callback(int fd, short event, void *_conn)
503 connection_t *conn = _conn;
504 (void)fd;
505 (void)event;
507 log_debug(LD_NET,"socket %d wants to read.",conn->s);
509 /* assert_connection_ok(conn, time(NULL)); */
511 if (connection_handle_read(conn) < 0) {
512 if (!conn->marked_for_close) {
513 #ifndef MS_WINDOWS
514 log_warn(LD_BUG,"Unhandled error on read for %s connection "
515 "(fd %d); removing",
516 conn_type_to_string(conn->type), conn->s);
517 tor_fragile_assert();
518 #endif
519 if (CONN_IS_EDGE(conn))
520 connection_edge_end_errno(TO_EDGE_CONN(conn));
521 connection_mark_for_close(conn);
524 assert_connection_ok(conn, time(NULL));
526 if (smartlist_len(closeable_connection_lst))
527 close_closeable_connections();
530 /** Libevent callback: this gets invoked when (connection_t*)<b>conn</b> has
531 * some data to write. */
532 static void
533 conn_write_callback(int fd, short events, void *_conn)
535 connection_t *conn = _conn;
536 (void)fd;
537 (void)events;
539 LOG_FN_CONN(conn, (LOG_DEBUG, LD_NET, "socket %d wants to write.",conn->s));
541 /* assert_connection_ok(conn, time(NULL)); */
543 if (connection_handle_write(conn, 0) < 0) {
544 if (!conn->marked_for_close) {
545 /* this connection is broken. remove it. */
546 log_fn(LOG_WARN,LD_BUG,
547 "unhandled error on write for %s connection (fd %d); removing",
548 conn_type_to_string(conn->type), conn->s);
549 tor_fragile_assert();
550 if (CONN_IS_EDGE(conn)) {
551 /* otherwise we cry wolf about duplicate close */
552 edge_connection_t *edge_conn = TO_EDGE_CONN(conn);
553 if (!edge_conn->end_reason)
554 edge_conn->end_reason = END_STREAM_REASON_INTERNAL;
555 edge_conn->edge_has_sent_end = 1;
557 connection_close_immediate(conn); /* So we don't try to flush. */
558 connection_mark_for_close(conn);
561 assert_connection_ok(conn, time(NULL));
563 if (smartlist_len(closeable_connection_lst))
564 close_closeable_connections();
567 /** If the connection at connection_array[i] is marked for close, then:
568 * - If it has data that it wants to flush, try to flush it.
569 * - If it _still_ has data to flush, and conn->hold_open_until_flushed is
570 * true, then leave the connection open and return.
571 * - Otherwise, remove the connection from connection_array and from
572 * all other lists, close it, and free it.
573 * Returns 1 if the connection was closed, 0 otherwise.
575 static int
576 conn_close_if_marked(int i)
578 connection_t *conn;
579 int retval;
580 time_t now;
582 conn = smartlist_get(connection_array, i);
583 if (!conn->marked_for_close)
584 return 0; /* nothing to see here, move along */
585 now = time(NULL);
586 assert_connection_ok(conn, now);
587 /* assert_all_pending_dns_resolves_ok(); */
589 log_debug(LD_NET,"Cleaning up connection (fd %d).",conn->s);
590 if ((conn->s >= 0 || conn->linked_conn) && connection_wants_to_flush(conn)) {
591 /* s == -1 means it's an incomplete edge connection, or that the socket
592 * has already been closed as unflushable. */
593 ssize_t sz = connection_bucket_write_limit(conn, now);
594 if (!conn->hold_open_until_flushed)
595 log_info(LD_NET,
596 "Conn (addr %s, fd %d, type %s, state %d) marked, but wants "
597 "to flush %d bytes. (Marked at %s:%d)",
598 escaped_safe_str_client(conn->address),
599 conn->s, conn_type_to_string(conn->type), conn->state,
600 (int)conn->outbuf_flushlen,
601 conn->marked_for_close_file, conn->marked_for_close);
602 if (conn->linked_conn) {
603 retval = move_buf_to_buf(conn->linked_conn->inbuf, conn->outbuf,
604 &conn->outbuf_flushlen);
605 if (retval >= 0) {
606 /* The linked conn will notice that it has data when it notices that
607 * we're gone. */
608 connection_start_reading_from_linked_conn(conn->linked_conn);
610 log_debug(LD_GENERAL, "Flushed last %d bytes from a linked conn; "
611 "%d left; flushlen %d; wants-to-flush==%d", retval,
612 (int)buf_datalen(conn->outbuf),
613 (int)conn->outbuf_flushlen,
614 connection_wants_to_flush(conn));
615 } else if (connection_speaks_cells(conn)) {
616 if (conn->state == OR_CONN_STATE_OPEN) {
617 retval = flush_buf_tls(TO_OR_CONN(conn)->tls, conn->outbuf, sz,
618 &conn->outbuf_flushlen);
619 } else
620 retval = -1; /* never flush non-open broken tls connections */
621 } else {
622 retval = flush_buf(conn->s, conn->outbuf, sz, &conn->outbuf_flushlen);
624 if (retval >= 0 && /* Technically, we could survive things like
625 TLS_WANT_WRITE here. But don't bother for now. */
626 conn->hold_open_until_flushed && connection_wants_to_flush(conn)) {
627 if (retval > 0) {
628 LOG_FN_CONN(conn, (LOG_INFO,LD_NET,
629 "Holding conn (fd %d) open for more flushing.",
630 conn->s));
631 conn->timestamp_lastwritten = now; /* reset so we can flush more */
633 return 0;
635 if (connection_wants_to_flush(conn)) {
636 int severity;
637 if (conn->type == CONN_TYPE_EXIT ||
638 (conn->type == CONN_TYPE_OR && server_mode(get_options())) ||
639 (conn->type == CONN_TYPE_DIR && conn->purpose == DIR_PURPOSE_SERVER))
640 severity = LOG_INFO;
641 else
642 severity = LOG_NOTICE;
643 /* XXXX Maybe allow this to happen a certain amount per hour; it usually
644 * is meaningless. */
645 log_fn(severity, LD_NET, "We stalled too much while trying to write %d "
646 "bytes to address %s. If this happens a lot, either "
647 "something is wrong with your network connection, or "
648 "something is wrong with theirs. "
649 "(fd %d, type %s, state %d, marked at %s:%d).",
650 (int)buf_datalen(conn->outbuf),
651 escaped_safe_str_client(conn->address),
652 conn->s, conn_type_to_string(conn->type), conn->state,
653 conn->marked_for_close_file,
654 conn->marked_for_close);
657 connection_unlink(conn); /* unlink, remove, free */
658 return 1;
661 /** We've just tried every dirserver we know about, and none of
662 * them were reachable. Assume the network is down. Change state
663 * so next time an application connection arrives we'll delay it
664 * and try another directory fetch. Kill off all the circuit_wait
665 * streams that are waiting now, since they will all timeout anyway.
667 void
668 directory_all_unreachable(time_t now)
670 connection_t *conn;
671 (void)now;
673 stats_n_seconds_working=0; /* reset it */
675 while ((conn = connection_get_by_type_state(CONN_TYPE_AP,
676 AP_CONN_STATE_CIRCUIT_WAIT))) {
677 edge_connection_t *edge_conn = TO_EDGE_CONN(conn);
678 log_notice(LD_NET,
679 "Is your network connection down? "
680 "Failing connection to '%s:%d'.",
681 safe_str_client(edge_conn->socks_request->address),
682 edge_conn->socks_request->port);
683 connection_mark_unattached_ap(edge_conn,
684 END_STREAM_REASON_NET_UNREACHABLE);
686 control_event_general_status(LOG_ERR, "DIR_ALL_UNREACHABLE");
689 /** This function is called whenever we successfully pull down some new
690 * network statuses or server descriptors. */
691 void
692 directory_info_has_arrived(time_t now, int from_cache)
694 or_options_t *options = get_options();
696 if (!router_have_minimum_dir_info()) {
697 int quiet = directory_too_idle_to_fetch_descriptors(options, now);
698 log(quiet ? LOG_INFO : LOG_NOTICE, LD_DIR,
699 "I learned some more directory information, but not enough to "
700 "build a circuit: %s", get_dir_info_status_string());
701 update_router_descriptor_downloads(now);
702 return;
703 } else {
704 if (directory_fetches_from_authorities(options))
705 update_router_descriptor_downloads(now);
707 /* if we have enough dir info, then update our guard status with
708 * whatever we just learned. */
709 entry_guards_compute_status();
710 /* Don't even bother trying to get extrainfo until the rest of our
711 * directory info is up-to-date */
712 if (options->DownloadExtraInfo)
713 update_extrainfo_downloads(now);
716 if (server_mode(options) && !we_are_hibernating() && !from_cache &&
717 (has_completed_circuit || !any_predicted_circuits(now)))
718 consider_testing_reachability(1, 1);
721 /** How long do we wait before killing OR connections with no circuits?
722 * In Tor versions up to 0.2.1.25 and 0.2.2.12-alpha, we waited 15 minutes
723 * before cancelling these connections, which caused fast relays to accrue
724 * many many idle connections. Hopefully 3 minutes is low enough that
725 * it kills most idle connections, without being so low that we cause
726 * clients to bounce on and off.
728 #define IDLE_OR_CONN_TIMEOUT 180
730 /** Perform regular maintenance tasks for a single connection. This
731 * function gets run once per second per connection by run_scheduled_events.
733 static void
734 run_connection_housekeeping(int i, time_t now)
736 cell_t cell;
737 connection_t *conn = smartlist_get(connection_array, i);
738 or_options_t *options = get_options();
739 or_connection_t *or_conn;
740 int past_keepalive =
741 now >= conn->timestamp_lastwritten + options->KeepalivePeriod;
743 if (conn->outbuf && !buf_datalen(conn->outbuf) && conn->type == CONN_TYPE_OR)
744 TO_OR_CONN(conn)->timestamp_lastempty = now;
746 if (conn->marked_for_close) {
747 /* nothing to do here */
748 return;
751 /* Expire any directory connections that haven't been active (sent
752 * if a server or received if a client) for 5 min */
753 if (conn->type == CONN_TYPE_DIR &&
754 ((DIR_CONN_IS_SERVER(conn) &&
755 conn->timestamp_lastwritten + DIR_CONN_MAX_STALL < now) ||
756 (!DIR_CONN_IS_SERVER(conn) &&
757 conn->timestamp_lastread + DIR_CONN_MAX_STALL < now))) {
758 log_info(LD_DIR,"Expiring wedged directory conn (fd %d, purpose %d)",
759 conn->s, conn->purpose);
760 /* This check is temporary; it's to let us know whether we should consider
761 * parsing partial serverdesc responses. */
762 if (conn->purpose == DIR_PURPOSE_FETCH_SERVERDESC &&
763 buf_datalen(conn->inbuf)>=1024) {
764 log_info(LD_DIR,"Trying to extract information from wedged server desc "
765 "download.");
766 connection_dir_reached_eof(TO_DIR_CONN(conn));
767 } else {
768 connection_mark_for_close(conn);
770 return;
773 if (!connection_speaks_cells(conn))
774 return; /* we're all done here, the rest is just for OR conns */
776 /* If we haven't written to an OR connection for a while, then either nuke
777 the connection or send a keepalive, depending. */
779 or_conn = TO_OR_CONN(conn);
780 tor_assert(conn->outbuf);
782 if (or_conn->is_bad_for_new_circs && !or_conn->n_circuits) {
783 /* It's bad for new circuits, and has no unmarked circuits on it:
784 * mark it now. */
785 log_info(LD_OR,
786 "Expiring non-used OR connection to fd %d (%s:%d) [Too old].",
787 conn->s, conn->address, conn->port);
788 if (conn->state == OR_CONN_STATE_CONNECTING)
789 connection_or_connect_failed(TO_OR_CONN(conn),
790 END_OR_CONN_REASON_TIMEOUT,
791 "Tor gave up on the connection");
792 connection_mark_for_close(conn);
793 conn->hold_open_until_flushed = 1;
794 } else if (!connection_state_is_open(conn)) {
795 if (past_keepalive) {
796 /* We never managed to actually get this connection open and happy. */
797 log_info(LD_OR,"Expiring non-open OR connection to fd %d (%s:%d).",
798 conn->s,conn->address, conn->port);
799 connection_mark_for_close(conn);
801 } else if (we_are_hibernating() && !or_conn->n_circuits &&
802 !buf_datalen(conn->outbuf)) {
803 /* We're hibernating, there's no circuits, and nothing to flush.*/
804 log_info(LD_OR,"Expiring non-used OR connection to fd %d (%s:%d) "
805 "[Hibernating or exiting].",
806 conn->s,conn->address, conn->port);
807 connection_mark_for_close(conn);
808 conn->hold_open_until_flushed = 1;
809 } else if (!or_conn->n_circuits &&
810 now >= or_conn->timestamp_last_added_nonpadding +
811 IDLE_OR_CONN_TIMEOUT) {
812 log_info(LD_OR,"Expiring non-used OR connection to fd %d (%s:%d) "
813 "[idle %d].", conn->s,conn->address, conn->port,
814 (int)(now - or_conn->timestamp_last_added_nonpadding));
815 connection_mark_for_close(conn);
816 conn->hold_open_until_flushed = 1;
817 } else if (
818 now >= or_conn->timestamp_lastempty + options->KeepalivePeriod*10 &&
819 now >= conn->timestamp_lastwritten + options->KeepalivePeriod*10) {
820 log_fn(LOG_PROTOCOL_WARN,LD_PROTOCOL,
821 "Expiring stuck OR connection to fd %d (%s:%d). (%d bytes to "
822 "flush; %d seconds since last write)",
823 conn->s, conn->address, conn->port,
824 (int)buf_datalen(conn->outbuf),
825 (int)(now-conn->timestamp_lastwritten));
826 connection_mark_for_close(conn);
827 } else if (past_keepalive && !buf_datalen(conn->outbuf)) {
828 /* send a padding cell */
829 log_fn(LOG_DEBUG,LD_OR,"Sending keepalive to (%s:%d)",
830 conn->address, conn->port);
831 memset(&cell,0,sizeof(cell_t));
832 cell.command = CELL_PADDING;
833 connection_or_write_cell_to_buf(&cell, or_conn);
837 /** Honor a NEWNYM request: make future requests unlinkable to past
838 * requests. */
839 static void
840 signewnym_impl(time_t now)
842 circuit_expire_all_dirty_circs();
843 addressmap_clear_transient();
844 time_of_last_signewnym = now;
845 signewnym_is_pending = 0;
848 /** Perform regular maintenance tasks. This function gets run once per
849 * second by second_elapsed_callback().
851 static void
852 run_scheduled_events(time_t now)
854 static time_t last_rotated_x509_certificate = 0;
855 static time_t time_to_check_v3_certificate = 0;
856 static time_t time_to_check_listeners = 0;
857 static time_t time_to_check_descriptor = 0;
858 static time_t time_to_check_ipaddress = 0;
859 static time_t time_to_shrink_memory = 0;
860 static time_t time_to_try_getting_descriptors = 0;
861 static time_t time_to_reset_descriptor_failures = 0;
862 static time_t time_to_add_entropy = 0;
863 static time_t time_to_write_bridge_status_file = 0;
864 static time_t time_to_downrate_stability = 0;
865 static time_t time_to_save_stability = 0;
866 static time_t time_to_clean_caches = 0;
867 static time_t time_to_recheck_bandwidth = 0;
868 static time_t time_to_check_for_expired_networkstatus = 0;
869 static time_t time_to_write_stats_files = 0;
870 static time_t time_to_write_bridge_stats = 0;
871 static int should_init_bridge_stats = 1;
872 static time_t time_to_retry_dns_init = 0;
873 or_options_t *options = get_options();
874 int i;
875 int have_dir_info;
877 /** 0. See if we've been asked to shut down and our timeout has
878 * expired; or if our bandwidth limits are exhausted and we
879 * should hibernate; or if it's time to wake up from hibernation.
881 consider_hibernation(now);
883 /* 0b. If we've deferred a signewnym, make sure it gets handled
884 * eventually. */
885 if (signewnym_is_pending &&
886 time_of_last_signewnym + MAX_SIGNEWNYM_RATE <= now) {
887 log(LOG_INFO, LD_CONTROL, "Honoring delayed NEWNYM request");
888 signewnym_impl(now);
891 /** 1a. Every MIN_ONION_KEY_LIFETIME seconds, rotate the onion keys,
892 * shut down and restart all cpuworkers, and update the directory if
893 * necessary.
895 if (server_mode(options) &&
896 get_onion_key_set_at()+MIN_ONION_KEY_LIFETIME < now) {
897 log_info(LD_GENERAL,"Rotating onion key.");
898 rotate_onion_key();
899 cpuworkers_rotate();
900 if (router_rebuild_descriptor(1)<0) {
901 log_info(LD_CONFIG, "Couldn't rebuild router descriptor");
903 if (advertised_server_mode())
904 router_upload_dir_desc_to_dirservers(0);
907 if (time_to_try_getting_descriptors < now) {
908 update_router_descriptor_downloads(now);
909 update_extrainfo_downloads(now);
910 if (options->UseBridges)
911 fetch_bridge_descriptors(now);
912 if (router_have_minimum_dir_info())
913 time_to_try_getting_descriptors = now + LAZY_DESCRIPTOR_RETRY_INTERVAL;
914 else
915 time_to_try_getting_descriptors = now + GREEDY_DESCRIPTOR_RETRY_INTERVAL;
918 if (time_to_reset_descriptor_failures < now) {
919 router_reset_descriptor_download_failures();
920 time_to_reset_descriptor_failures =
921 now + DESCRIPTOR_FAILURE_RESET_INTERVAL;
924 /** 1b. Every MAX_SSL_KEY_LIFETIME seconds, we change our TLS context. */
925 if (!last_rotated_x509_certificate)
926 last_rotated_x509_certificate = now;
927 if (last_rotated_x509_certificate+MAX_SSL_KEY_LIFETIME < now) {
928 log_info(LD_GENERAL,"Rotating tls context.");
929 if (tor_tls_context_new(get_identity_key(), MAX_SSL_KEY_LIFETIME) < 0) {
930 log_warn(LD_BUG, "Error reinitializing TLS context");
931 /* XXX is it a bug here, that we just keep going? -RD */
933 last_rotated_x509_certificate = now;
934 /* We also make sure to rotate the TLS connections themselves if they've
935 * been up for too long -- but that's done via is_bad_for_new_circs in
936 * connection_run_housekeeping() above. */
939 if (time_to_add_entropy < now) {
940 if (time_to_add_entropy) {
941 /* We already seeded once, so don't die on failure. */
942 crypto_seed_rng(0);
944 /** How often do we add more entropy to OpenSSL's RNG pool? */
945 #define ENTROPY_INTERVAL (60*60)
946 time_to_add_entropy = now + ENTROPY_INTERVAL;
949 /** 1c. If we have to change the accounting interval or record
950 * bandwidth used in this accounting interval, do so. */
951 if (accounting_is_enabled(options))
952 accounting_run_housekeeping(now);
954 if (now % 10 == 0 && (authdir_mode_tests_reachability(options)) &&
955 !we_are_hibernating()) {
956 /* try to determine reachability of the other Tor relays */
957 dirserv_test_reachability(now);
960 /** 1d. Periodically, we discount older stability information so that new
961 * stability info counts more, and save the stability information to disk as
962 * appropriate. */
963 if (time_to_downrate_stability < now)
964 time_to_downrate_stability = rep_hist_downrate_old_runs(now);
965 if (authdir_mode_tests_reachability(options)) {
966 if (time_to_save_stability < now) {
967 if (time_to_save_stability && rep_hist_record_mtbf_data(now, 1)<0) {
968 log_warn(LD_GENERAL, "Couldn't store mtbf data.");
970 #define SAVE_STABILITY_INTERVAL (30*60)
971 time_to_save_stability = now + SAVE_STABILITY_INTERVAL;
975 /* 1e. Periodically, if we're a v3 authority, we check whether our cert is
976 * close to expiring and warn the admin if it is. */
977 if (time_to_check_v3_certificate < now) {
978 v3_authority_check_key_expiry();
979 #define CHECK_V3_CERTIFICATE_INTERVAL (5*60)
980 time_to_check_v3_certificate = now + CHECK_V3_CERTIFICATE_INTERVAL;
983 /* 1f. Check whether our networkstatus has expired.
985 if (time_to_check_for_expired_networkstatus < now) {
986 networkstatus_t *ns = networkstatus_get_latest_consensus();
987 /*XXXX RD: This value needs to be the same as REASONABLY_LIVE_TIME in
988 * networkstatus_get_reasonably_live_consensus(), but that value is way
989 * way too high. Arma: is the bridge issue there resolved yet? -NM */
990 #define NS_EXPIRY_SLOP (24*60*60)
991 if (ns && ns->valid_until < now+NS_EXPIRY_SLOP &&
992 router_have_minimum_dir_info()) {
993 router_dir_info_changed();
995 #define CHECK_EXPIRED_NS_INTERVAL (2*60)
996 time_to_check_for_expired_networkstatus = now + CHECK_EXPIRED_NS_INTERVAL;
999 /* 1g. Check whether we should write statistics to disk.
1001 if (time_to_write_stats_files < now) {
1002 #define CHECK_WRITE_STATS_INTERVAL (60*60)
1003 time_t next_time_to_write_stats_files = (time_to_write_stats_files > 0 ?
1004 time_to_write_stats_files : now) + CHECK_WRITE_STATS_INTERVAL;
1005 if (options->CellStatistics) {
1006 time_t next_write =
1007 rep_hist_buffer_stats_write(time_to_write_stats_files);
1008 if (next_write && next_write < next_time_to_write_stats_files)
1009 next_time_to_write_stats_files = next_write;
1011 if (options->DirReqStatistics) {
1012 time_t next_write = geoip_dirreq_stats_write(time_to_write_stats_files);
1013 if (next_write && next_write < next_time_to_write_stats_files)
1014 next_time_to_write_stats_files = next_write;
1016 if (options->EntryStatistics) {
1017 time_t next_write = geoip_entry_stats_write(time_to_write_stats_files);
1018 if (next_write && next_write < next_time_to_write_stats_files)
1019 next_time_to_write_stats_files = next_write;
1021 if (options->ExitPortStatistics) {
1022 time_t next_write = rep_hist_exit_stats_write(time_to_write_stats_files);
1023 if (next_write && next_write < next_time_to_write_stats_files)
1024 next_time_to_write_stats_files = next_write;
1026 time_to_write_stats_files = next_time_to_write_stats_files;
1029 /* 1h. Check whether we should write bridge statistics to disk.
1031 if (should_record_bridge_info(options)) {
1032 if (time_to_write_bridge_stats < now) {
1033 if (should_init_bridge_stats) {
1034 /* (Re-)initialize bridge statistics. */
1035 geoip_bridge_stats_init(now);
1036 time_to_write_bridge_stats = now + WRITE_STATS_INTERVAL;
1037 should_init_bridge_stats = 0;
1038 } else {
1039 /* Possibly write bridge statistics to disk and ask when to write
1040 * them next time. */
1041 time_to_write_bridge_stats = geoip_bridge_stats_write(
1042 time_to_write_bridge_stats);
1045 } else if (!should_init_bridge_stats) {
1046 /* Bridge mode was turned off. Ensure that stats are re-initialized
1047 * next time bridge mode is turned on. */
1048 should_init_bridge_stats = 1;
1051 /* Remove old information from rephist and the rend cache. */
1052 if (time_to_clean_caches < now) {
1053 rep_history_clean(now - options->RephistTrackTime);
1054 rend_cache_clean();
1055 rend_cache_clean_v2_descs_as_dir();
1056 #define CLEAN_CACHES_INTERVAL (30*60)
1057 time_to_clean_caches = now + CLEAN_CACHES_INTERVAL;
1060 #define RETRY_DNS_INTERVAL (10*60)
1061 /* If we're a server and initializing dns failed, retry periodically. */
1062 if (time_to_retry_dns_init < now) {
1063 time_to_retry_dns_init = now + RETRY_DNS_INTERVAL;
1064 if (server_mode(options) && has_dns_init_failed())
1065 dns_init();
1068 /** 2. Periodically, we consider force-uploading our descriptor
1069 * (if we've passed our internal checks). */
1071 /** How often do we check whether part of our router info has changed in a way
1072 * that would require an upload? */
1073 #define CHECK_DESCRIPTOR_INTERVAL (60)
1074 /** How often do we (as a router) check whether our IP address has changed? */
1075 #define CHECK_IPADDRESS_INTERVAL (15*60)
1077 /* 2b. Once per minute, regenerate and upload the descriptor if the old
1078 * one is inaccurate. */
1079 if (time_to_check_descriptor < now) {
1080 static int dirport_reachability_count = 0;
1081 time_to_check_descriptor = now + CHECK_DESCRIPTOR_INTERVAL;
1082 check_descriptor_bandwidth_changed(now);
1083 if (time_to_check_ipaddress < now) {
1084 time_to_check_ipaddress = now + CHECK_IPADDRESS_INTERVAL;
1085 check_descriptor_ipaddress_changed(now);
1087 /** If our router descriptor ever goes this long without being regenerated
1088 * because something changed, we force an immediate regenerate-and-upload. */
1089 #define FORCE_REGENERATE_DESCRIPTOR_INTERVAL (18*60*60)
1090 mark_my_descriptor_dirty_if_older_than(
1091 now - FORCE_REGENERATE_DESCRIPTOR_INTERVAL);
1092 consider_publishable_server(0);
1093 /* also, check religiously for reachability, if it's within the first
1094 * 20 minutes of our uptime. */
1095 if (server_mode(options) &&
1096 (has_completed_circuit || !any_predicted_circuits(now)) &&
1097 !we_are_hibernating()) {
1098 if (stats_n_seconds_working < TIMEOUT_UNTIL_UNREACHABILITY_COMPLAINT) {
1099 consider_testing_reachability(1, dirport_reachability_count==0);
1100 if (++dirport_reachability_count > 5)
1101 dirport_reachability_count = 0;
1102 } else if (time_to_recheck_bandwidth < now) {
1103 /* If we haven't checked for 12 hours and our bandwidth estimate is
1104 * low, do another bandwidth test. This is especially important for
1105 * bridges, since they might go long periods without much use. */
1106 routerinfo_t *me = router_get_my_routerinfo();
1107 if (time_to_recheck_bandwidth && me &&
1108 me->bandwidthcapacity < me->bandwidthrate &&
1109 me->bandwidthcapacity < 51200) {
1110 reset_bandwidth_test();
1112 #define BANDWIDTH_RECHECK_INTERVAL (12*60*60)
1113 time_to_recheck_bandwidth = now + BANDWIDTH_RECHECK_INTERVAL;
1117 /* If any networkstatus documents are no longer recent, we need to
1118 * update all the descriptors' running status. */
1119 /* purge obsolete entries */
1120 networkstatus_v2_list_clean(now);
1121 /* Remove dead routers. */
1122 routerlist_remove_old_routers();
1124 /* Also, once per minute, check whether we want to download any
1125 * networkstatus documents.
1127 update_networkstatus_downloads(now);
1130 /** 2c. Let directory voting happen. */
1131 if (authdir_mode_v3(options))
1132 dirvote_act(options, now);
1134 /** 3a. Every second, we examine pending circuits and prune the
1135 * ones which have been pending for more than a few seconds.
1136 * We do this before step 4, so it can try building more if
1137 * it's not comfortable with the number of available circuits.
1139 circuit_expire_building(now);
1141 /** 3b. Also look at pending streams and prune the ones that 'began'
1142 * a long time ago but haven't gotten a 'connected' yet.
1143 * Do this before step 4, so we can put them back into pending
1144 * state to be picked up by the new circuit.
1146 connection_ap_expire_beginning();
1148 /** 3c. And expire connections that we've held open for too long.
1150 connection_expire_held_open();
1152 /** 3d. And every 60 seconds, we relaunch listeners if any died. */
1153 if (!we_are_hibernating() && time_to_check_listeners < now) {
1154 retry_all_listeners(NULL, NULL);
1155 time_to_check_listeners = now+60;
1158 /** 4. Every second, we try a new circuit if there are no valid
1159 * circuits. Every NewCircuitPeriod seconds, we expire circuits
1160 * that became dirty more than MaxCircuitDirtiness seconds ago,
1161 * and we make a new circ if there are no clean circuits.
1163 have_dir_info = router_have_minimum_dir_info();
1164 if (have_dir_info && !we_are_hibernating())
1165 circuit_build_needed_circs(now);
1167 /* every 10 seconds, but not at the same second as other such events */
1168 if (now % 10 == 5)
1169 circuit_expire_old_circuits_serverside(now);
1171 /** 5. We do housekeeping for each connection... */
1172 connection_or_set_bad_connections();
1173 for (i=0;i<smartlist_len(connection_array);i++) {
1174 run_connection_housekeeping(i, now);
1176 if (time_to_shrink_memory < now) {
1177 SMARTLIST_FOREACH(connection_array, connection_t *, conn, {
1178 if (conn->outbuf)
1179 buf_shrink(conn->outbuf);
1180 if (conn->inbuf)
1181 buf_shrink(conn->inbuf);
1183 clean_cell_pool();
1184 buf_shrink_freelists(0);
1185 /** How often do we check buffers and pools for empty space that can be
1186 * deallocated? */
1187 #define MEM_SHRINK_INTERVAL (60)
1188 time_to_shrink_memory = now + MEM_SHRINK_INTERVAL;
1191 /** 6. And remove any marked circuits... */
1192 circuit_close_all_marked();
1194 /** 7. And upload service descriptors if necessary. */
1195 if (has_completed_circuit && !we_are_hibernating()) {
1196 rend_consider_services_upload(now);
1197 rend_consider_descriptor_republication();
1200 /** 8. and blow away any connections that need to die. have to do this now,
1201 * because if we marked a conn for close and left its socket -1, then
1202 * we'll pass it to poll/select and bad things will happen.
1204 close_closeable_connections();
1206 /** 8b. And if anything in our state is ready to get flushed to disk, we
1207 * flush it. */
1208 or_state_save(now);
1210 /** 9. and if we're a server, check whether our DNS is telling stories to
1211 * us. */
1212 if (server_mode(options) && time_to_check_for_correct_dns < now) {
1213 if (!time_to_check_for_correct_dns) {
1214 time_to_check_for_correct_dns = now + 60 + crypto_rand_int(120);
1215 } else {
1216 dns_launch_correctness_checks();
1217 time_to_check_for_correct_dns = now + 12*3600 +
1218 crypto_rand_int(12*3600);
1222 /** 10b. write bridge networkstatus file to disk */
1223 if (options->BridgeAuthoritativeDir &&
1224 time_to_write_bridge_status_file < now) {
1225 networkstatus_dump_bridge_status_to_file(now);
1226 #define BRIDGE_STATUSFILE_INTERVAL (30*60)
1227 time_to_write_bridge_status_file = now+BRIDGE_STATUSFILE_INTERVAL;
1231 /** Timer: used to invoke second_elapsed_callback() once per second. */
1232 static periodic_timer_t *second_timer = NULL;
1233 /** Number of libevent errors in the last second: we die if we get too many. */
1234 static int n_libevent_errors = 0;
1236 /** Libevent callback: invoked once every second. */
1237 static void
1238 second_elapsed_callback(periodic_timer_t *timer, void *arg)
1240 /* XXXX This could be sensibly refactored into multiple callbacks, and we
1241 * could use Libevent's timers for this rather than checking the current
1242 * time against a bunch of timeouts every second. */
1243 static time_t current_second = 0;
1244 time_t now;
1245 size_t bytes_written;
1246 size_t bytes_read;
1247 int seconds_elapsed;
1248 or_options_t *options = get_options();
1249 (void)timer;
1250 (void)arg;
1252 n_libevent_errors = 0;
1254 /* log_notice(LD_GENERAL, "Tick."); */
1255 now = time(NULL);
1256 update_approx_time(now);
1258 /* the second has rolled over. check more stuff. */
1259 bytes_written = stats_prev_global_write_bucket - global_write_bucket;
1260 bytes_read = stats_prev_global_read_bucket - global_read_bucket;
1261 seconds_elapsed = current_second ? (int)(now - current_second) : 0;
1262 stats_n_bytes_read += bytes_read;
1263 stats_n_bytes_written += bytes_written;
1264 if (accounting_is_enabled(options) && seconds_elapsed >= 0)
1265 accounting_add_bytes(bytes_read, bytes_written, seconds_elapsed);
1266 control_event_bandwidth_used((uint32_t)bytes_read,(uint32_t)bytes_written);
1267 control_event_stream_bandwidth_used();
1269 if (seconds_elapsed > 0)
1270 connection_bucket_refill(seconds_elapsed, now);
1271 stats_prev_global_read_bucket = global_read_bucket;
1272 stats_prev_global_write_bucket = global_write_bucket;
1274 if (server_mode(options) &&
1275 !we_are_hibernating() &&
1276 seconds_elapsed > 0 &&
1277 has_completed_circuit &&
1278 stats_n_seconds_working / TIMEOUT_UNTIL_UNREACHABILITY_COMPLAINT !=
1279 (stats_n_seconds_working+seconds_elapsed) /
1280 TIMEOUT_UNTIL_UNREACHABILITY_COMPLAINT) {
1281 /* every 20 minutes, check and complain if necessary */
1282 routerinfo_t *me = router_get_my_routerinfo();
1283 if (me && !check_whether_orport_reachable()) {
1284 log_warn(LD_CONFIG,"Your server (%s:%d) has not managed to confirm that "
1285 "its ORPort is reachable. Please check your firewalls, ports, "
1286 "address, /etc/hosts file, etc.",
1287 me->address, me->or_port);
1288 control_event_server_status(LOG_WARN,
1289 "REACHABILITY_FAILED ORADDRESS=%s:%d",
1290 me->address, me->or_port);
1293 if (me && !check_whether_dirport_reachable()) {
1294 log_warn(LD_CONFIG,
1295 "Your server (%s:%d) has not managed to confirm that its "
1296 "DirPort is reachable. Please check your firewalls, ports, "
1297 "address, /etc/hosts file, etc.",
1298 me->address, me->dir_port);
1299 control_event_server_status(LOG_WARN,
1300 "REACHABILITY_FAILED DIRADDRESS=%s:%d",
1301 me->address, me->dir_port);
1305 /** If more than this many seconds have elapsed, probably the clock
1306 * jumped: doesn't count. */
1307 #define NUM_JUMPED_SECONDS_BEFORE_WARN 100
1308 if (seconds_elapsed < -NUM_JUMPED_SECONDS_BEFORE_WARN ||
1309 seconds_elapsed >= NUM_JUMPED_SECONDS_BEFORE_WARN) {
1310 circuit_note_clock_jumped(seconds_elapsed);
1311 /* XXX if the time jumps *back* many months, do our events in
1312 * run_scheduled_events() recover? I don't think they do. -RD */
1313 } else if (seconds_elapsed > 0)
1314 stats_n_seconds_working += seconds_elapsed;
1316 run_scheduled_events(now);
1318 current_second = now; /* remember which second it is, for next time */
1321 #ifndef MS_WINDOWS
1322 /** Called when a possibly ignorable libevent error occurs; ensures that we
1323 * don't get into an infinite loop by ignoring too many errors from
1324 * libevent. */
1325 static int
1326 got_libevent_error(void)
1328 if (++n_libevent_errors > 8) {
1329 log_err(LD_NET, "Too many libevent errors in one second; dying");
1330 return -1;
1332 return 0;
1334 #endif
1336 #define UPTIME_CUTOFF_FOR_NEW_BANDWIDTH_TEST (6*60*60)
1338 /** Called when our IP address seems to have changed. <b>at_interface</b>
1339 * should be true if we detected a change in our interface, and false if we
1340 * detected a change in our published address. */
1341 void
1342 ip_address_changed(int at_interface)
1344 int server = server_mode(get_options());
1346 if (at_interface) {
1347 if (! server) {
1348 /* Okay, change our keys. */
1349 init_keys();
1351 } else {
1352 if (server) {
1353 if (stats_n_seconds_working > UPTIME_CUTOFF_FOR_NEW_BANDWIDTH_TEST)
1354 reset_bandwidth_test();
1355 stats_n_seconds_working = 0;
1356 router_reset_reachability();
1357 mark_my_descriptor_dirty();
1361 dns_servers_relaunch_checks();
1364 /** Forget what we've learned about the correctness of our DNS servers, and
1365 * start learning again. */
1366 void
1367 dns_servers_relaunch_checks(void)
1369 if (server_mode(get_options())) {
1370 dns_reset_correctness_checks();
1371 time_to_check_for_correct_dns = 0;
1375 /** Called when we get a SIGHUP: reload configuration files and keys,
1376 * retry all connections, and so on. */
1377 static int
1378 do_hup(void)
1380 or_options_t *options = get_options();
1382 #ifdef USE_DMALLOC
1383 dmalloc_log_stats();
1384 dmalloc_log_changed(0, 1, 0, 0);
1385 #endif
1387 log_notice(LD_GENERAL,"Received reload signal (hup). Reloading config and "
1388 "resetting internal state.");
1389 if (accounting_is_enabled(options))
1390 accounting_record_bandwidth_usage(time(NULL), get_or_state());
1392 router_reset_warnings();
1393 routerlist_reset_warnings();
1394 addressmap_clear_transient();
1395 /* first, reload config variables, in case they've changed */
1396 if (options->ReloadTorrcOnSIGHUP) {
1397 /* no need to provide argc/v, they've been cached in init_from_config */
1398 if (options_init_from_torrc(0, NULL) < 0) {
1399 log_err(LD_CONFIG,"Reading config failed--see warnings above. "
1400 "For usage, try -h.");
1401 return -1;
1403 options = get_options(); /* they have changed now */
1404 } else {
1405 log_notice(LD_GENERAL, "Not reloading config file: the controller told "
1406 "us not to.");
1408 if (authdir_mode_handles_descs(options, -1)) {
1409 /* reload the approved-routers file */
1410 if (dirserv_load_fingerprint_file() < 0) {
1411 /* warnings are logged from dirserv_load_fingerprint_file() directly */
1412 log_info(LD_GENERAL, "Error reloading fingerprints. "
1413 "Continuing with old list.");
1417 /* Rotate away from the old dirty circuits. This has to be done
1418 * after we've read the new options, but before we start using
1419 * circuits for directory fetches. */
1420 circuit_expire_all_dirty_circs();
1422 /* retry appropriate downloads */
1423 router_reset_status_download_failures();
1424 router_reset_descriptor_download_failures();
1425 update_networkstatus_downloads(time(NULL));
1427 /* We'll retry routerstatus downloads in about 10 seconds; no need to
1428 * force a retry there. */
1430 if (server_mode(options)) {
1431 /* Restart cpuworker and dnsworker processes, so they get up-to-date
1432 * configuration options. */
1433 cpuworkers_rotate();
1434 dns_reset();
1436 return 0;
1439 /** Tor main loop. */
1440 /* static */ int
1441 do_main_loop(void)
1443 int loop_result;
1444 time_t now;
1446 /* initialize dns resolve map, spawn workers if needed */
1447 if (dns_init() < 0) {
1448 if (get_options()->ServerDNSAllowBrokenConfig)
1449 log_warn(LD_GENERAL, "Couldn't set up any working nameservers. "
1450 "Network not up yet? Will try again soon.");
1451 else {
1452 log_err(LD_GENERAL,"Error initializing dns subsystem; exiting. To "
1453 "retry instead, set the ServerDNSAllowBrokenResolvConf option.");
1457 handle_signals(1);
1459 /* load the private keys, if we're supposed to have them, and set up the
1460 * TLS context. */
1461 if (! identity_key_is_set()) {
1462 if (init_keys() < 0) {
1463 log_err(LD_BUG,"Error initializing keys; exiting");
1464 return -1;
1468 /* Set up the packed_cell_t memory pool. */
1469 init_cell_pool();
1471 /* Set up our buckets */
1472 connection_bucket_init();
1473 stats_prev_global_read_bucket = global_read_bucket;
1474 stats_prev_global_write_bucket = global_write_bucket;
1476 /* initialize the bootstrap status events to know we're starting up */
1477 control_event_bootstrap(BOOTSTRAP_STATUS_STARTING, 0);
1479 if (trusted_dirs_reload_certs()) {
1480 log_warn(LD_DIR,
1481 "Couldn't load all cached v3 certificates. Starting anyway.");
1483 if (router_reload_v2_networkstatus()) {
1484 return -1;
1486 if (router_reload_consensus_networkstatus()) {
1487 return -1;
1489 /* load the routers file, or assign the defaults. */
1490 if (router_reload_router_list()) {
1491 return -1;
1493 /* load the networkstatuses. (This launches a download for new routers as
1494 * appropriate.)
1496 now = time(NULL);
1497 directory_info_has_arrived(now, 1);
1499 if (server_mode(get_options())) {
1500 /* launch cpuworkers. Need to do this *after* we've read the onion key. */
1501 cpu_init();
1504 /* set up once-a-second callback. */
1505 if (! second_timer) {
1506 struct timeval one_second;
1507 one_second.tv_sec = 1;
1508 one_second.tv_usec = 0;
1510 second_timer = periodic_timer_new(tor_libevent_get_base(),
1511 &one_second,
1512 second_elapsed_callback,
1513 NULL);
1514 tor_assert(second_timer);
1517 for (;;) {
1518 if (nt_service_is_stopping())
1519 return 0;
1521 #ifndef MS_WINDOWS
1522 /* Make it easier to tell whether libevent failure is our fault or not. */
1523 errno = 0;
1524 #endif
1525 /* All active linked conns should get their read events activated. */
1526 SMARTLIST_FOREACH(active_linked_connection_lst, connection_t *, conn,
1527 event_active(conn->read_event, EV_READ, 1));
1528 called_loop_once = smartlist_len(active_linked_connection_lst) ? 1 : 0;
1530 update_approx_time(time(NULL));
1532 /* poll until we have an event, or the second ends, or until we have
1533 * some active linked connections to trigger events for. */
1534 loop_result = event_base_loop(tor_libevent_get_base(),
1535 called_loop_once ? EVLOOP_ONCE : 0);
1537 /* let catch() handle things like ^c, and otherwise don't worry about it */
1538 if (loop_result < 0) {
1539 int e = tor_socket_errno(-1);
1540 /* let the program survive things like ^z */
1541 if (e != EINTR && !ERRNO_IS_EINPROGRESS(e)) {
1542 log_err(LD_NET,"libevent call with %s failed: %s [%d]",
1543 tor_libevent_get_method(), tor_socket_strerror(e), e);
1544 return -1;
1545 #ifndef MS_WINDOWS
1546 } else if (e == EINVAL) {
1547 log_warn(LD_NET, "EINVAL from libevent: should you upgrade libevent?");
1548 if (got_libevent_error())
1549 return -1;
1550 #endif
1551 } else {
1552 if (ERRNO_IS_EINPROGRESS(e))
1553 log_warn(LD_BUG,
1554 "libevent call returned EINPROGRESS? Please report.");
1555 log_debug(LD_NET,"libevent call interrupted.");
1556 /* You can't trust the results of this poll(). Go back to the
1557 * top of the big for loop. */
1558 continue;
1564 /** Used to implement the SIGNAL control command: if we accept
1565 * <b>the_signal</b> as a remote pseudo-signal, act on it. */
1566 /* We don't re-use catch() here because:
1567 * 1. We handle a different set of signals than those allowed in catch.
1568 * 2. Platforms without signal() are unlikely to define SIGfoo.
1569 * 3. The control spec is defined to use fixed numeric signal values
1570 * which just happen to match the Unix values.
1572 void
1573 control_signal_act(int the_signal)
1575 switch (the_signal)
1577 case 1:
1578 signal_callback(0,0,(void*)(uintptr_t)SIGHUP);
1579 break;
1580 case 2:
1581 signal_callback(0,0,(void*)(uintptr_t)SIGINT);
1582 break;
1583 case 10:
1584 signal_callback(0,0,(void*)(uintptr_t)SIGUSR1);
1585 break;
1586 case 12:
1587 signal_callback(0,0,(void*)(uintptr_t)SIGUSR2);
1588 break;
1589 case 15:
1590 signal_callback(0,0,(void*)(uintptr_t)SIGTERM);
1591 break;
1592 case SIGNEWNYM:
1593 signal_callback(0,0,(void*)(uintptr_t)SIGNEWNYM);
1594 break;
1595 case SIGCLEARDNSCACHE:
1596 signal_callback(0,0,(void*)(uintptr_t)SIGCLEARDNSCACHE);
1597 break;
1598 default:
1599 log_warn(LD_BUG, "Unrecognized signal number %d.", the_signal);
1600 break;
1604 /** Libevent callback: invoked when we get a signal.
1606 static void
1607 signal_callback(int fd, short events, void *arg)
1609 uintptr_t sig = (uintptr_t)arg;
1610 (void)fd;
1611 (void)events;
1612 switch (sig)
1614 case SIGTERM:
1615 log_notice(LD_GENERAL,"Catching signal TERM, exiting cleanly.");
1616 tor_cleanup();
1617 exit(0);
1618 break;
1619 case SIGINT:
1620 if (!server_mode(get_options())) { /* do it now */
1621 log_notice(LD_GENERAL,"Interrupt: exiting cleanly.");
1622 tor_cleanup();
1623 exit(0);
1625 hibernate_begin_shutdown();
1626 break;
1627 #ifdef SIGPIPE
1628 case SIGPIPE:
1629 log_debug(LD_GENERAL,"Caught SIGPIPE. Ignoring.");
1630 break;
1631 #endif
1632 case SIGUSR1:
1633 /* prefer to log it at INFO, but make sure we always see it */
1634 dumpstats(get_min_log_level()<LOG_INFO ? get_min_log_level() : LOG_INFO);
1635 break;
1636 case SIGUSR2:
1637 switch_logs_debug();
1638 log_debug(LD_GENERAL,"Caught USR2, going to loglevel debug. "
1639 "Send HUP to change back.");
1640 break;
1641 case SIGHUP:
1642 if (do_hup() < 0) {
1643 log_warn(LD_CONFIG,"Restart failed (config error?). Exiting.");
1644 tor_cleanup();
1645 exit(1);
1647 break;
1648 #ifdef SIGCHLD
1649 case SIGCHLD:
1650 while (waitpid(-1,NULL,WNOHANG) > 0) ; /* keep reaping until no more
1651 zombies */
1652 break;
1653 #endif
1654 case SIGNEWNYM: {
1655 time_t now = time(NULL);
1656 if (time_of_last_signewnym + MAX_SIGNEWNYM_RATE > now) {
1657 signewnym_is_pending = 1;
1658 log(LOG_NOTICE, LD_CONTROL,
1659 "Rate limiting NEWNYM request: delaying by %d second(s)",
1660 (int)(MAX_SIGNEWNYM_RATE+time_of_last_signewnym-now));
1661 } else {
1662 signewnym_impl(now);
1664 break;
1666 case SIGCLEARDNSCACHE:
1667 addressmap_clear_transient();
1668 break;
1672 extern uint64_t rephist_total_alloc;
1673 extern uint32_t rephist_total_num;
1676 * Write current memory usage information to the log.
1678 static void
1679 dumpmemusage(int severity)
1681 connection_dump_buffer_mem_stats(severity);
1682 log(severity, LD_GENERAL, "In rephist: "U64_FORMAT" used by %d Tors.",
1683 U64_PRINTF_ARG(rephist_total_alloc), rephist_total_num);
1684 dump_routerlist_mem_usage(severity);
1685 dump_cell_pool_usage(severity);
1686 dump_dns_mem_usage(severity);
1687 buf_dump_freelist_sizes(severity);
1688 tor_log_mallinfo(severity);
1691 /** Write all statistics to the log, with log level <b>severity</b>. Called
1692 * in response to a SIGUSR1. */
1693 static void
1694 dumpstats(int severity)
1696 time_t now = time(NULL);
1697 time_t elapsed;
1698 size_t rbuf_cap, wbuf_cap, rbuf_len, wbuf_len;
1700 log(severity, LD_GENERAL, "Dumping stats:");
1702 SMARTLIST_FOREACH(connection_array, connection_t *, conn,
1704 int i = conn_sl_idx;
1705 log(severity, LD_GENERAL,
1706 "Conn %d (socket %d) type %d (%s), state %d (%s), created %d secs ago",
1707 i, conn->s, conn->type, conn_type_to_string(conn->type),
1708 conn->state, conn_state_to_string(conn->type, conn->state),
1709 (int)(now - conn->timestamp_created));
1710 if (!connection_is_listener(conn)) {
1711 log(severity,LD_GENERAL,
1712 "Conn %d is to %s:%d.", i,
1713 safe_str_client(conn->address),
1714 conn->port);
1715 log(severity,LD_GENERAL,
1716 "Conn %d: %d bytes waiting on inbuf (len %d, last read %d secs ago)",
1718 (int)buf_datalen(conn->inbuf),
1719 (int)buf_allocation(conn->inbuf),
1720 (int)(now - conn->timestamp_lastread));
1721 log(severity,LD_GENERAL,
1722 "Conn %d: %d bytes waiting on outbuf "
1723 "(len %d, last written %d secs ago)",i,
1724 (int)buf_datalen(conn->outbuf),
1725 (int)buf_allocation(conn->outbuf),
1726 (int)(now - conn->timestamp_lastwritten));
1727 if (conn->type == CONN_TYPE_OR) {
1728 or_connection_t *or_conn = TO_OR_CONN(conn);
1729 if (or_conn->tls) {
1730 tor_tls_get_buffer_sizes(or_conn->tls, &rbuf_cap, &rbuf_len,
1731 &wbuf_cap, &wbuf_len);
1732 log(severity, LD_GENERAL,
1733 "Conn %d: %d/%d bytes used on OpenSSL read buffer; "
1734 "%d/%d bytes used on write buffer.",
1735 i, (int)rbuf_len, (int)rbuf_cap, (int)wbuf_len, (int)wbuf_cap);
1739 circuit_dump_by_conn(conn, severity); /* dump info about all the circuits
1740 * using this conn */
1742 log(severity, LD_NET,
1743 "Cells processed: "U64_FORMAT" padding\n"
1744 " "U64_FORMAT" create\n"
1745 " "U64_FORMAT" created\n"
1746 " "U64_FORMAT" relay\n"
1747 " ("U64_FORMAT" relayed)\n"
1748 " ("U64_FORMAT" delivered)\n"
1749 " "U64_FORMAT" destroy",
1750 U64_PRINTF_ARG(stats_n_padding_cells_processed),
1751 U64_PRINTF_ARG(stats_n_create_cells_processed),
1752 U64_PRINTF_ARG(stats_n_created_cells_processed),
1753 U64_PRINTF_ARG(stats_n_relay_cells_processed),
1754 U64_PRINTF_ARG(stats_n_relay_cells_relayed),
1755 U64_PRINTF_ARG(stats_n_relay_cells_delivered),
1756 U64_PRINTF_ARG(stats_n_destroy_cells_processed));
1757 if (stats_n_data_cells_packaged)
1758 log(severity,LD_NET,"Average packaged cell fullness: %2.3f%%",
1759 100*(U64_TO_DBL(stats_n_data_bytes_packaged) /
1760 U64_TO_DBL(stats_n_data_cells_packaged*RELAY_PAYLOAD_SIZE)) );
1761 if (stats_n_data_cells_received)
1762 log(severity,LD_NET,"Average delivered cell fullness: %2.3f%%",
1763 100*(U64_TO_DBL(stats_n_data_bytes_received) /
1764 U64_TO_DBL(stats_n_data_cells_received*RELAY_PAYLOAD_SIZE)) );
1766 if (now - time_of_process_start >= 0)
1767 elapsed = now - time_of_process_start;
1768 else
1769 elapsed = 0;
1771 if (elapsed) {
1772 log(severity, LD_NET,
1773 "Average bandwidth: "U64_FORMAT"/%d = %d bytes/sec reading",
1774 U64_PRINTF_ARG(stats_n_bytes_read),
1775 (int)elapsed,
1776 (int) (stats_n_bytes_read/elapsed));
1777 log(severity, LD_NET,
1778 "Average bandwidth: "U64_FORMAT"/%d = %d bytes/sec writing",
1779 U64_PRINTF_ARG(stats_n_bytes_written),
1780 (int)elapsed,
1781 (int) (stats_n_bytes_written/elapsed));
1784 log(severity, LD_NET, "--------------- Dumping memory information:");
1785 dumpmemusage(severity);
1787 rep_hist_dump_stats(now,severity);
1788 rend_service_dump_stats(severity);
1789 dump_pk_ops(severity);
1790 dump_distinct_digest_count(severity);
/** Called by exit() as we shut down the process.  On Windows this calls
 * WSACleanup(); elsewhere it does nothing.
 */
static void
exit_function(void)
{
  /* NOTE: If we ever daemonize, this gets called immediately. That's
   * okay for now, because we only use this on Windows. */
#ifdef MS_WINDOWS
  WSACleanup();
#endif
}
1805 /** Set up the signal handlers for either parent or child. */
1806 void
1807 handle_signals(int is_parent)
1809 #ifndef MS_WINDOWS /* do signal stuff only on Unix */
1810 int i;
1811 static const int signals[] = {
1812 SIGINT, /* do a controlled slow shutdown */
1813 SIGTERM, /* to terminate now */
1814 SIGPIPE, /* otherwise SIGPIPE kills us */
1815 SIGUSR1, /* dump stats */
1816 SIGUSR2, /* go to loglevel debug */
1817 SIGHUP, /* to reload config, retry conns, etc */
1818 #ifdef SIGXFSZ
1819 SIGXFSZ, /* handle file-too-big resource exhaustion */
1820 #endif
1821 SIGCHLD, /* handle dns/cpu workers that exit */
1822 -1 };
1823 static struct event *signal_events[16]; /* bigger than it has to be. */
1824 if (is_parent) {
1825 for (i = 0; signals[i] >= 0; ++i) {
1826 signal_events[i] = tor_evsignal_new(
1827 tor_libevent_get_base(), signals[i], signal_callback,
1828 (void*)(uintptr_t)signals[i]);
1829 if (event_add(signal_events[i], NULL))
1830 log_warn(LD_BUG, "Error from libevent when adding event for signal %d",
1831 signals[i]);
1833 } else {
1834 struct sigaction action;
1835 action.sa_flags = 0;
1836 sigemptyset(&action.sa_mask);
1837 action.sa_handler = SIG_IGN;
1838 sigaction(SIGINT, &action, NULL);
1839 sigaction(SIGTERM, &action, NULL);
1840 sigaction(SIGPIPE, &action, NULL);
1841 sigaction(SIGUSR1, &action, NULL);
1842 sigaction(SIGUSR2, &action, NULL);
1843 sigaction(SIGHUP, &action, NULL);
1844 #ifdef SIGXFSZ
1845 sigaction(SIGXFSZ, &action, NULL);
1846 #endif
1848 #else /* MS windows */
1849 (void)is_parent;
1850 #endif /* signal stuff */
1853 /** Main entry point for the Tor command-line client.
1855 /* static */ int
1856 tor_init(int argc, char *argv[])
1858 char buf[256];
1859 int i, quiet = 0;
1860 time_of_process_start = time(NULL);
1861 if (!connection_array)
1862 connection_array = smartlist_create();
1863 if (!closeable_connection_lst)
1864 closeable_connection_lst = smartlist_create();
1865 if (!active_linked_connection_lst)
1866 active_linked_connection_lst = smartlist_create();
1867 /* Have the log set up with our application name. */
1868 tor_snprintf(buf, sizeof(buf), "Tor %s", get_version());
1869 log_set_application_name(buf);
1870 /* Initialize the history structures. */
1871 rep_hist_init();
1872 /* Initialize the service cache. */
1873 rend_cache_init();
1874 addressmap_init(); /* Init the client dns cache. Do it always, since it's
1875 * cheap. */
1877 /* We search for the "quiet" option first, since it decides whether we
1878 * will log anything at all to the command line. */
1879 for (i=1;i<argc;++i) {
1880 if (!strcmp(argv[i], "--hush"))
1881 quiet = 1;
1882 if (!strcmp(argv[i], "--quiet"))
1883 quiet = 2;
1885 /* give it somewhere to log to initially */
1886 switch (quiet) {
1887 case 2:
1888 /* no initial logging */
1889 break;
1890 case 1:
1891 add_temp_log(LOG_WARN);
1892 break;
1893 default:
1894 add_temp_log(LOG_NOTICE);
1897 log(LOG_NOTICE, LD_GENERAL, "Tor v%s. This is experimental software. "
1898 "Do not rely on it for strong anonymity. (Running on %s)",get_version(),
1899 get_uname());
1901 if (network_init()<0) {
1902 log_err(LD_BUG,"Error initializing network; exiting.");
1903 return -1;
1905 atexit(exit_function);
1907 if (options_init_from_torrc(argc,argv) < 0) {
1908 log_err(LD_CONFIG,"Reading config failed--see warnings above.");
1909 return -1;
1912 #ifndef MS_WINDOWS
1913 if (geteuid()==0)
1914 log_warn(LD_GENERAL,"You are running Tor as root. You don't need to, "
1915 "and you probably shouldn't.");
1916 #endif
1918 if (crypto_global_init(get_options()->HardwareAccel,
1919 get_options()->AccelName,
1920 get_options()->AccelDir)) {
1921 log_err(LD_BUG, "Unable to initialize OpenSSL. Exiting.");
1922 return -1;
1925 return 0;
1928 /** A lockfile structure, used to prevent two Tors from messing with the
1929 * data directory at once. If this variable is non-NULL, we're holding
1930 * the lockfile. */
1931 static tor_lockfile_t *lockfile = NULL;
1933 /** Try to grab the lock file described in <b>options</b>, if we do not
1934 * already have it. If <b>err_if_locked</b> is true, warn if somebody else is
1935 * holding the lock, and exit if we can't get it after waiting. Otherwise,
1936 * return -1 if we can't get the lockfile. Return 0 on success.
1939 try_locking(or_options_t *options, int err_if_locked)
1941 if (lockfile)
1942 return 0;
1943 else {
1944 char *fname = options_get_datadir_fname2_suffix(options, "lock",NULL,NULL);
1945 int already_locked = 0;
1946 tor_lockfile_t *lf = tor_lockfile_lock(fname, 0, &already_locked);
1947 tor_free(fname);
1948 if (!lf) {
1949 if (err_if_locked && already_locked) {
1950 int r;
1951 log_warn(LD_GENERAL, "It looks like another Tor process is running "
1952 "with the same data directory. Waiting 5 seconds to see "
1953 "if it goes away.");
1954 #ifndef WIN32
1955 sleep(5);
1956 #else
1957 Sleep(5000);
1958 #endif
1959 r = try_locking(options, 0);
1960 if (r<0) {
1961 log_err(LD_GENERAL, "No, it's still there. Exiting.");
1962 exit(0);
1964 return r;
1966 return -1;
1968 lockfile = lf;
1969 return 0;
1973 /** Return true iff we've successfully acquired the lock file. */
1975 have_lockfile(void)
1977 return lockfile != NULL;
1980 /** If we have successfully acquired the lock file, release it. */
1981 void
1982 release_lockfile(void)
1984 if (lockfile) {
1985 tor_lockfile_unlock(lockfile);
1986 lockfile = NULL;
1990 /** Free all memory that we might have allocated somewhere.
1991 * If <b>postfork</b>, we are a worker process and we want to free
1992 * only the parts of memory that we won't touch. If !<b>postfork</b>,
1993 * Tor is shutting down and we should free everything.
1995 * Helps us find the real leaks with dmalloc and the like. Also valgrind
1996 * should then report 0 reachable in its leak report (in an ideal world --
1997 * in practice libevent, SSL, libc etc never quite free everything). */
1998 void
1999 tor_free_all(int postfork)
2001 if (!postfork) {
2002 evdns_shutdown(1);
2004 geoip_free_all();
2005 dirvote_free_all();
2006 routerlist_free_all();
2007 networkstatus_free_all();
2008 addressmap_free_all();
2009 dirserv_free_all();
2010 rend_service_free_all();
2011 rend_cache_free_all();
2012 rend_service_authorization_free_all();
2013 rep_hist_free_all();
2014 dns_free_all();
2015 clear_pending_onions();
2016 circuit_free_all();
2017 entry_guards_free_all();
2018 connection_free_all();
2019 buf_shrink_freelists(1);
2020 memarea_clear_freelist();
2021 microdesc_free_all();
2022 if (!postfork) {
2023 config_free_all();
2024 router_free_all();
2025 policies_free_all();
2027 free_cell_pool();
2028 if (!postfork) {
2029 tor_tls_free_all();
2031 /* stuff in main.c */
2033 smartlist_free(connection_array);
2034 smartlist_free(closeable_connection_lst);
2035 smartlist_free(active_linked_connection_lst);
2036 periodic_timer_free(second_timer);
2037 if (!postfork) {
2038 release_lockfile();
2040 /* Stuff in util.c and address.c*/
2041 if (!postfork) {
2042 escaped(NULL);
2043 esc_router_info(NULL);
2044 logs_free_all(); /* free log strings. do this last so logs keep working. */
2048 /** Do whatever cleanup is necessary before shutting Tor down. */
2049 void
2050 tor_cleanup(void)
2052 or_options_t *options = get_options();
2053 /* Remove our pid file. We don't care if there was an error when we
2054 * unlink, nothing we could do about it anyways. */
2055 if (options->command == CMD_RUN_TOR) {
2056 time_t now = time(NULL);
2057 if (options->PidFile)
2058 unlink(options->PidFile);
2059 if (accounting_is_enabled(options))
2060 accounting_record_bandwidth_usage(now, get_or_state());
2061 or_state_mark_dirty(get_or_state(), 0); /* force an immediate save. */
2062 or_state_save(now);
2063 if (authdir_mode_tests_reachability(options))
2064 rep_hist_record_mtbf_data(now, 0);
2066 #ifdef USE_DMALLOC
2067 dmalloc_log_stats();
2068 #endif
2069 tor_free_all(0); /* We could move tor_free_all back into the ifdef below
2070 later, if it makes shutdown unacceptably slow. But for
2071 now, leave it here: it's helped us catch bugs in the
2072 past. */
2073 crypto_global_cleanup();
2074 #ifdef USE_DMALLOC
2075 dmalloc_log_unfreed();
2076 dmalloc_shutdown();
2077 #endif
2080 /** Read/create keys as needed, and echo our fingerprint to stdout. */
2081 /* static */ int
2082 do_list_fingerprint(void)
2084 char buf[FINGERPRINT_LEN+1];
2085 crypto_pk_env_t *k;
2086 const char *nickname = get_options()->Nickname;
2087 if (!server_mode(get_options())) {
2088 log_err(LD_GENERAL,
2089 "Clients don't have long-term identity keys. Exiting.\n");
2090 return -1;
2092 tor_assert(nickname);
2093 if (init_keys() < 0) {
2094 log_err(LD_BUG,"Error initializing keys; can't display fingerprint");
2095 return -1;
2097 if (!(k = get_identity_key())) {
2098 log_err(LD_GENERAL,"Error: missing identity key.");
2099 return -1;
2101 if (crypto_pk_get_fingerprint(k, buf, 1)<0) {
2102 log_err(LD_BUG, "Error computing fingerprint");
2103 return -1;
2105 printf("%s %s\n", nickname, buf);
2106 return 0;
2109 /** Entry point for password hashing: take the desired password from
2110 * the command line, and print its salted hash to stdout. **/
2111 /* static */ void
2112 do_hash_password(void)
2115 char output[256];
2116 char key[S2K_SPECIFIER_LEN+DIGEST_LEN];
2118 crypto_rand(key, S2K_SPECIFIER_LEN-1);
2119 key[S2K_SPECIFIER_LEN-1] = (uint8_t)96; /* Hash 64 K of data. */
2120 secret_to_key(key+S2K_SPECIFIER_LEN, DIGEST_LEN,
2121 get_options()->command_arg, strlen(get_options()->command_arg),
2122 key);
2123 base16_encode(output, sizeof(output), key, sizeof(key));
2124 printf("16:%s\n",output);
#if defined (WINCE)
/** Copy the name reported by FindFirstFlashCard() into <b>path</b>, a
 * buffer with room for <b>size</b> wide characters.  The result is always
 * NUL-terminated; a name that does not fit is truncated.
 *
 * Returns 0 on success.  Returns -1 if <b>path</b> is NULL, <b>size</b> is
 * 0, no flash card is found, or the reported name is empty. */
int
find_flashcard_path(PWCHAR path, size_t size)
{
  WIN32_FIND_DATA d = {0};
  HANDLE h = NULL;

  if (!path || size == 0)
    return -1;

  h = FindFirstFlashCard(&d);
  if (h == INVALID_HANDLE_VALUE)
    return -1;

  if (wcslen(d.cFileName) == 0) {
    FindClose(h);
    return -1;
  }

  /* wcsncpy() does not terminate the destination when the source fills
   * it, so copy at most size-1 characters and terminate explicitly. */
  wcsncpy(path,d.cFileName,size - 1);
  path[size - 1] = L'\0';
  FindClose(h);
  return 0;
}
#endif
2152 /** Main entry point for the Tor process. Called from main(). */
2153 /* This function is distinct from main() only so we can link main.c into
2154 * the unittest binary without conflicting with the unittests' main. */
2156 tor_main(int argc, char *argv[])
2158 int result = 0;
2159 #if defined (WINCE)
2160 WCHAR path [MAX_PATH] = {0};
2161 WCHAR fullpath [MAX_PATH] = {0};
2162 PWCHAR p = NULL;
2163 FILE* redir = NULL;
2164 FILE* redirdbg = NULL;
2166 // this is to facilitate debugging by opening
2167 // a file on a folder shared by the wm emulator.
2168 // if no flashcard (real or emulated) is present,
2169 // log files will be written in the root folder
2170 if (find_flashcard_path(path,MAX_PATH) == -1)
2172 redir = _wfreopen( L"\\stdout.log", L"w", stdout );
2173 redirdbg = _wfreopen( L"\\stderr.log", L"w", stderr );
2174 } else {
2175 swprintf(fullpath,L"\\%s\\tor",path);
2176 CreateDirectory(fullpath,NULL);
2178 swprintf(fullpath,L"\\%s\\tor\\stdout.log",path);
2179 redir = _wfreopen( fullpath, L"w", stdout );
2181 swprintf(fullpath,L"\\%s\\tor\\stderr.log",path);
2182 redirdbg = _wfreopen( fullpath, L"w", stderr );
2184 #endif
2186 update_approx_time(time(NULL));
2187 tor_threads_init();
2188 init_logging();
2189 #ifdef USE_DMALLOC
2191 /* Instruct OpenSSL to use our internal wrappers for malloc,
2192 realloc and free. */
2193 int r = CRYPTO_set_mem_ex_functions(_tor_malloc, _tor_realloc, _tor_free);
2194 tor_assert(r);
2196 #endif
2197 #ifdef NT_SERVICE
2199 int done = 0;
2200 result = nt_service_parse_options(argc, argv, &done);
2201 if (done) return result;
2203 #endif
2204 if (tor_init(argc, argv)<0)
2205 return -1;
2206 switch (get_options()->command) {
2207 case CMD_RUN_TOR:
2208 #ifdef NT_SERVICE
2209 nt_service_set_state(SERVICE_RUNNING);
2210 #endif
2211 result = do_main_loop();
2212 break;
2213 case CMD_LIST_FINGERPRINT:
2214 result = do_list_fingerprint();
2215 break;
2216 case CMD_HASH_PASSWORD:
2217 do_hash_password();
2218 result = 0;
2219 break;
2220 case CMD_VERIFY_CONFIG:
2221 printf("Configuration was valid\n");
2222 result = 0;
2223 break;
2224 case CMD_RUN_UNITTESTS: /* only set by test.c */
2225 default:
2226 log_warn(LD_BUG,"Illegal command number %d: internal error.",
2227 get_options()->command);
2228 result = -1;
2230 tor_cleanup();
2231 return result;