Dnsmasq v2.68 rc4
[tomato.git] / release / src / router / dnsmasq / src / forward.c
blobd967348e980556353648d7d7f2514df850526887
/* dnsmasq is Copyright (c) 2000-2013 Simon Kelley

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; version 2 dated June, 1991, or
   (at your option) version 3 dated 29 June, 2007.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program.  If not, see <http://www.gnu.org/licenses/>.
*/
17 #include "dnsmasq.h"
/* Prototypes for file-local (static) helpers that the functions below
   call. */
static struct frec *lookup_frec(unsigned short id, unsigned int crc);
static struct frec *lookup_frec_by_sender(unsigned short id,
                                          union mysockaddr *addr,
                                          unsigned int crc);
static unsigned short get_id(unsigned int crc);
static void free_frec(struct frec *f);
static struct randfd *allocate_rfd(int family);
27 /* Send a UDP packet with its source address set as "source"
28 unless nowild is true, when we just send it with the kernel default */
29 int send_from(int fd, int nowild, char *packet, size_t len,
30 union mysockaddr *to, struct all_addr *source,
31 unsigned int iface)
33 struct msghdr msg;
34 struct iovec iov[1];
35 union {
36 struct cmsghdr align; /* this ensures alignment */
37 #if defined(HAVE_LINUX_NETWORK)
38 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
39 #elif defined(IP_SENDSRCADDR)
40 char control[CMSG_SPACE(sizeof(struct in_addr))];
41 #endif
42 #ifdef HAVE_IPV6
43 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
44 #endif
45 } control_u;
47 iov[0].iov_base = packet;
48 iov[0].iov_len = len;
50 msg.msg_control = NULL;
51 msg.msg_controllen = 0;
52 msg.msg_flags = 0;
53 msg.msg_name = to;
54 msg.msg_namelen = sa_len(to);
55 msg.msg_iov = iov;
56 msg.msg_iovlen = 1;
58 if (!nowild)
60 struct cmsghdr *cmptr;
61 msg.msg_control = &control_u;
62 msg.msg_controllen = sizeof(control_u);
63 cmptr = CMSG_FIRSTHDR(&msg);
65 if (to->sa.sa_family == AF_INET)
67 #if defined(HAVE_LINUX_NETWORK)
68 struct in_pktinfo p;
69 p.ipi_ifindex = 0;
70 p.ipi_spec_dst = source->addr.addr4;
71 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
72 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_pktinfo));
73 cmptr->cmsg_level = IPPROTO_IP;
74 cmptr->cmsg_type = IP_PKTINFO;
75 #elif defined(IP_SENDSRCADDR)
76 memcpy(CMSG_DATA(cmptr), &(source->addr.addr4), sizeof(source->addr.addr4));
77 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_addr));
78 cmptr->cmsg_level = IPPROTO_IP;
79 cmptr->cmsg_type = IP_SENDSRCADDR;
80 #endif
82 else
83 #ifdef HAVE_IPV6
85 struct in6_pktinfo p;
86 p.ipi6_ifindex = iface; /* Need iface for IPv6 to handle link-local addrs */
87 p.ipi6_addr = source->addr.addr6;
88 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
89 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
90 cmptr->cmsg_type = daemon->v6pktinfo;
91 cmptr->cmsg_level = IPPROTO_IPV6;
93 #else
94 (void)iface; /* eliminate warning */
95 #endif
98 while (sendmsg(fd, &msg, 0) == -1)
100 if (retry_send())
101 continue;
103 /* If interface is still in DAD, EINVAL results - ignore that. */
104 if (errno == EINVAL)
105 break;
107 my_syslog(LOG_ERR, _("failed to send packet: %s"), strerror(errno));
108 return 0;
111 return 1;
114 static unsigned int search_servers(time_t now, struct all_addr **addrpp,
115 unsigned int qtype, char *qdomain, int *type, char **domain, int *norebind)
118 /* If the query ends in the domain in one of our servers, set
119 domain to point to that name. We find the largest match to allow both
120 domain.org and sub.domain.org to exist. */
122 unsigned int namelen = strlen(qdomain);
123 unsigned int matchlen = 0;
124 struct server *serv;
125 unsigned int flags = 0;
127 for (serv = daemon->servers; serv; serv=serv->next)
128 /* domain matches take priority over NODOTS matches */
129 if ((serv->flags & SERV_FOR_NODOTS) && *type != SERV_HAS_DOMAIN && !strchr(qdomain, '.') && namelen != 0)
131 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
132 *type = SERV_FOR_NODOTS;
133 if (serv->flags & SERV_NO_ADDR)
134 flags = F_NXDOMAIN;
135 else if (serv->flags & SERV_LITERAL_ADDRESS)
137 if (sflag & qtype)
139 flags = sflag;
140 if (serv->addr.sa.sa_family == AF_INET)
141 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
142 #ifdef HAVE_IPV6
143 else
144 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
145 #endif
147 else if (!flags || (flags & F_NXDOMAIN))
148 flags = F_NOERR;
151 else if (serv->flags & SERV_HAS_DOMAIN)
153 unsigned int domainlen = strlen(serv->domain);
154 char *matchstart = qdomain + namelen - domainlen;
155 if (namelen >= domainlen &&
156 hostname_isequal(matchstart, serv->domain) &&
157 (domainlen == 0 || namelen == domainlen || *(matchstart-1) == '.' ))
159 if (serv->flags & SERV_NO_REBIND)
160 *norebind = 1;
161 else
163 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
164 /* implement priority rules for --address and --server for same domain.
165 --address wins if the address is for the correct AF
166 --server wins otherwise. */
167 if (domainlen != 0 && domainlen == matchlen)
169 if ((serv->flags & SERV_LITERAL_ADDRESS))
171 if (!(sflag & qtype) && flags == 0)
172 continue;
174 else
176 if (flags & (F_IPV4 | F_IPV6))
177 continue;
181 if (domainlen >= matchlen)
183 *type = serv->flags & (SERV_HAS_DOMAIN | SERV_USE_RESOLV | SERV_NO_REBIND);
184 *domain = serv->domain;
185 matchlen = domainlen;
186 if (serv->flags & SERV_NO_ADDR)
187 flags = F_NXDOMAIN;
188 else if (serv->flags & SERV_LITERAL_ADDRESS)
190 if (sflag & qtype)
192 flags = sflag;
193 if (serv->addr.sa.sa_family == AF_INET)
194 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
195 #ifdef HAVE_IPV6
196 else
197 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
198 #endif
200 else if (!flags || (flags & F_NXDOMAIN))
201 flags = F_NOERR;
203 else
204 flags = 0;
210 if (flags == 0 && !(qtype & F_QUERY) &&
211 option_bool(OPT_NODOTS_LOCAL) && !strchr(qdomain, '.') && namelen != 0)
212 /* don't forward A or AAAA queries for simple names, except the empty name */
213 flags = F_NOERR;
215 if (flags == F_NXDOMAIN && check_for_local_domain(qdomain, now))
216 flags = F_NOERR;
218 if (flags)
220 int logflags = 0;
222 if (flags == F_NXDOMAIN || flags == F_NOERR)
223 logflags = F_NEG | qtype;
225 log_query(logflags | flags | F_CONFIG | F_FORWARD, qdomain, *addrpp, NULL);
227 else if ((*type) & SERV_USE_RESOLV)
229 *type = 0; /* use normal servers for this domain */
230 *domain = NULL;
232 return flags;
235 static int forward_query(int udpfd, union mysockaddr *udpaddr,
236 struct all_addr *dst_addr, unsigned int dst_iface,
237 struct dns_header *header, size_t plen, time_t now, struct frec *forward)
239 char *domain = NULL;
240 int type = 0, norebind = 0;
241 struct all_addr *addrp = NULL;
242 unsigned int crc = questions_crc(header, plen, daemon->namebuff);
243 unsigned int flags = 0;
244 unsigned int gotname = extract_request(header, plen, daemon->namebuff, NULL);
245 struct server *start = NULL;
247 /* RFC 4035: sect 4.6 para 2 */
248 header->hb4 &= ~HB4_AD;
250 /* may be no servers available. */
251 if (!daemon->servers)
252 forward = NULL;
253 else if (forward || (forward = lookup_frec_by_sender(ntohs(header->id), udpaddr, crc)))
255 /* retry on existing query, send to all available servers */
256 domain = forward->sentto->domain;
257 forward->sentto->failed_queries++;
258 if (!option_bool(OPT_ORDER))
260 forward->forwardall = 1;
261 daemon->last_server = NULL;
263 type = forward->sentto->flags & SERV_TYPE;
264 if (!(start = forward->sentto->next))
265 start = daemon->servers; /* at end of list, recycle */
266 header->id = htons(forward->new_id);
268 else
270 if (gotname)
271 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
273 if (!flags && !(forward = get_new_frec(now, NULL)))
274 /* table full - server failure. */
275 flags = F_NEG;
277 if (forward)
279 forward->source = *udpaddr;
280 forward->dest = *dst_addr;
281 forward->iface = dst_iface;
282 forward->orig_id = ntohs(header->id);
283 forward->new_id = get_id(crc);
284 forward->fd = udpfd;
285 forward->crc = crc;
286 forward->forwardall = 0;
287 forward->flags = 0;
288 if (norebind)
289 forward->flags |= FREC_NOREBIND;
290 if (header->hb4 & HB4_CD)
291 forward->flags |= FREC_CHECKING_DISABLED;
293 header->id = htons(forward->new_id);
295 /* In strict_order mode, always try servers in the order
296 specified in resolv.conf, if a domain is given
297 always try all the available servers,
298 otherwise, use the one last known to work. */
300 if (type == 0)
302 if (option_bool(OPT_ORDER))
303 start = daemon->servers;
304 else if (!(start = daemon->last_server) ||
305 daemon->forwardcount++ > FORWARD_TEST ||
306 difftime(now, daemon->forwardtime) > FORWARD_TIME)
308 start = daemon->servers;
309 forward->forwardall = 1;
310 daemon->forwardcount = 0;
311 daemon->forwardtime = now;
314 else
316 start = daemon->servers;
317 if (!option_bool(OPT_ORDER))
318 forward->forwardall = 1;
323 /* check for send errors here (no route to host)
324 if we fail to send to all nameservers, send back an error
325 packet straight away (helps modem users when offline) */
327 if (!flags && forward)
329 struct server *firstsentto = start;
330 int forwarded = 0;
332 if (option_bool(OPT_ADD_MAC))
333 plen = add_mac(header, plen, ((char *) header) + PACKETSZ, &forward->source);
335 if (option_bool(OPT_CLIENT_SUBNET))
337 size_t new = add_source_addr(header, plen, ((char *) header) + PACKETSZ, &forward->source);
338 if (new != plen)
340 plen = new;
341 forward->flags |= FREC_HAS_SUBNET;
345 while (1)
347 /* only send to servers dealing with our domain.
348 domain may be NULL, in which case server->domain
349 must be NULL also. */
351 if (type == (start->flags & SERV_TYPE) &&
352 (type != SERV_HAS_DOMAIN || hostname_isequal(domain, start->domain)) &&
353 !(start->flags & SERV_LITERAL_ADDRESS))
355 int fd;
357 /* find server socket to use, may need to get random one. */
358 if (start->sfd)
359 fd = start->sfd->fd;
360 else
362 #ifdef HAVE_IPV6
363 if (start->addr.sa.sa_family == AF_INET6)
365 if (!forward->rfd6 &&
366 !(forward->rfd6 = allocate_rfd(AF_INET6)))
367 break;
368 daemon->rfd_save = forward->rfd6;
369 fd = forward->rfd6->fd;
371 else
372 #endif
374 if (!forward->rfd4 &&
375 !(forward->rfd4 = allocate_rfd(AF_INET)))
376 break;
377 daemon->rfd_save = forward->rfd4;
378 fd = forward->rfd4->fd;
381 #ifdef HAVE_CONNTRACK
382 /* Copy connection mark of incoming query to outgoing connection. */
383 if (option_bool(OPT_CONNTRACK))
385 unsigned int mark;
386 if (get_incoming_mark(&forward->source, &forward->dest, 0, &mark))
387 setsockopt(fd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
389 #endif
392 if (sendto(fd, (char *)header, plen, 0,
393 &start->addr.sa,
394 sa_len(&start->addr)) == -1)
396 if (retry_send())
397 continue;
399 else
401 /* Keep info in case we want to re-send this packet */
402 daemon->srv_save = start;
403 daemon->packet_len = plen;
405 if (!gotname)
406 strcpy(daemon->namebuff, "query");
407 if (start->addr.sa.sa_family == AF_INET)
408 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
409 (struct all_addr *)&start->addr.in.sin_addr, NULL);
410 #ifdef HAVE_IPV6
411 else
412 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
413 (struct all_addr *)&start->addr.in6.sin6_addr, NULL);
414 #endif
415 start->queries++;
416 forwarded = 1;
417 forward->sentto = start;
418 if (!forward->forwardall)
419 break;
420 forward->forwardall++;
424 if (!(start = start->next))
425 start = daemon->servers;
427 if (start == firstsentto)
428 break;
431 if (forwarded)
432 return 1;
434 /* could not send on, prepare to return */
435 header->id = htons(forward->orig_id);
436 free_frec(forward); /* cancel */
439 /* could not send on, return empty answer or address if known for whole domain */
440 if (udpfd != -1)
442 plen = setup_reply(header, plen, addrp, flags, daemon->local_ttl);
443 send_from(udpfd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND), (char *)header, plen, udpaddr, dst_addr, dst_iface);
446 return 0;
449 static size_t process_reply(struct dns_header *header, time_t now, struct server *server, size_t n, int check_rebind,
450 int checking_disabled, int check_subnet, union mysockaddr *query_source)
452 unsigned char *pheader, *sizep;
453 char **sets = 0;
454 int munged = 0, is_sign;
455 size_t plen;
457 #ifdef HAVE_IPSET
458 /* Similar algorithm to search_servers. */
459 struct ipsets *ipset_pos;
460 unsigned int namelen = strlen(daemon->namebuff);
461 unsigned int matchlen = 0;
462 for (ipset_pos = daemon->ipsets; ipset_pos; ipset_pos = ipset_pos->next)
464 unsigned int domainlen = strlen(ipset_pos->domain);
465 char *matchstart = daemon->namebuff + namelen - domainlen;
466 if (namelen >= domainlen && hostname_isequal(matchstart, ipset_pos->domain) &&
467 (domainlen == 0 || namelen == domainlen || *(matchstart - 1) == '.' ) &&
468 domainlen >= matchlen) {
469 matchlen = domainlen;
470 sets = ipset_pos->sets;
473 #endif
475 /* If upstream is advertising a larger UDP packet size
476 than we allow, trim it so that we don't get overlarge
477 requests for the client. We can't do this for signed packets. */
479 if ((pheader = find_pseudoheader(header, n, &plen, &sizep, &is_sign)))
481 if (!is_sign)
483 unsigned short udpsz;
484 unsigned char *psave = sizep;
486 GETSHORT(udpsz, sizep);
487 if (udpsz > daemon->edns_pktsz)
488 PUTSHORT(daemon->edns_pktsz, psave);
491 if (check_subnet && !check_source(header, plen, pheader, query_source))
493 my_syslog(LOG_WARNING, _("discarding DNS reply: subnet option mismatch"));
494 return 0;
499 /* RFC 4035 sect 4.6 para 3 */
500 if (!is_sign && !option_bool(OPT_DNSSEC))
501 header->hb4 &= ~HB4_AD;
503 if (OPCODE(header) != QUERY || (RCODE(header) != NOERROR && RCODE(header) != NXDOMAIN))
504 return n;
506 /* Complain loudly if the upstream server is non-recursive. */
507 if (!(header->hb4 & HB4_RA) && RCODE(header) == NOERROR && ntohs(header->ancount) == 0 &&
508 server && !(server->flags & SERV_WARNED_RECURSIVE))
510 prettyprint_addr(&server->addr, daemon->namebuff);
511 my_syslog(LOG_WARNING, _("nameserver %s refused to do a recursive query"), daemon->namebuff);
512 if (!option_bool(OPT_LOG))
513 server->flags |= SERV_WARNED_RECURSIVE;
516 if (daemon->bogus_addr && RCODE(header) != NXDOMAIN &&
517 check_for_bogus_wildcard(header, n, daemon->namebuff, daemon->bogus_addr, now))
519 munged = 1;
520 SET_RCODE(header, NXDOMAIN);
521 header->hb3 &= ~HB3_AA;
523 else
525 if (RCODE(header) == NXDOMAIN &&
526 extract_request(header, n, daemon->namebuff, NULL) &&
527 check_for_local_domain(daemon->namebuff, now))
529 /* if we forwarded a query for a locally known name (because it was for
530 an unknown type) and the answer is NXDOMAIN, convert that to NODATA,
531 since we know that the domain exists, even if upstream doesn't */
532 munged = 1;
533 header->hb3 |= HB3_AA;
534 SET_RCODE(header, NOERROR);
537 if (extract_addresses(header, n, daemon->namebuff, now, sets, is_sign, check_rebind, checking_disabled))
539 my_syslog(LOG_WARNING, _("possible DNS-rebind attack detected: %s"), daemon->namebuff);
540 munged = 1;
544 /* do this after extract_addresses. Ensure NODATA reply and remove
545 nameserver info. */
547 if (munged)
549 header->ancount = htons(0);
550 header->nscount = htons(0);
551 header->arcount = htons(0);
554 /* the bogus-nxdomain stuff, doctor and NXDOMAIN->NODATA munging can all elide
555 sections of the packet. Find the new length here and put back pseudoheader
556 if it was removed. */
557 return resize_packet(header, n, pheader, plen);
560 /* sets new last_server */
561 void reply_query(int fd, int family, time_t now)
563 /* packet from peer server, extract data for cache, and send to
564 original requester */
565 struct dns_header *header;
566 union mysockaddr serveraddr;
567 struct frec *forward;
568 socklen_t addrlen = sizeof(serveraddr);
569 ssize_t n = recvfrom(fd, daemon->packet, daemon->edns_pktsz, 0, &serveraddr.sa, &addrlen);
570 size_t nn;
571 struct server *server;
573 /* packet buffer overwritten */
574 daemon->srv_save = NULL;
576 /* Determine the address of the server replying so that we can mark that as good */
577 serveraddr.sa.sa_family = family;
578 #ifdef HAVE_IPV6
579 if (serveraddr.sa.sa_family == AF_INET6)
580 serveraddr.in6.sin6_flowinfo = 0;
581 #endif
583 /* spoof check: answer must come from known server, */
584 for (server = daemon->servers; server; server = server->next)
585 if (!(server->flags & (SERV_LITERAL_ADDRESS | SERV_NO_ADDR)) &&
586 sockaddr_isequal(&server->addr, &serveraddr))
587 break;
589 header = (struct dns_header *)daemon->packet;
591 if (!server ||
592 n < (int)sizeof(struct dns_header) || !(header->hb3 & HB3_QR) ||
593 !(forward = lookup_frec(ntohs(header->id), questions_crc(header, n, daemon->namebuff))))
594 return;
596 server = forward->sentto;
598 if ((RCODE(header) == SERVFAIL || RCODE(header) == REFUSED) &&
599 !option_bool(OPT_ORDER) &&
600 forward->forwardall == 0)
601 /* for broken servers, attempt to send to another one. */
603 unsigned char *pheader;
604 size_t plen;
605 int is_sign;
607 /* recreate query from reply */
608 pheader = find_pseudoheader(header, (size_t)n, &plen, NULL, &is_sign);
609 if (!is_sign)
611 header->ancount = htons(0);
612 header->nscount = htons(0);
613 header->arcount = htons(0);
614 if ((nn = resize_packet(header, (size_t)n, pheader, plen)))
616 header->hb3 &= ~(HB3_QR | HB3_TC);
617 forward_query(-1, NULL, NULL, 0, header, nn, now, forward);
618 return;
623 if ((forward->sentto->flags & SERV_TYPE) == 0)
625 if (RCODE(header) == SERVFAIL || RCODE(header) == REFUSED)
626 server = NULL;
627 else
629 struct server *last_server;
631 /* find good server by address if possible, otherwise assume the last one we sent to */
632 for (last_server = daemon->servers; last_server; last_server = last_server->next)
633 if (!(last_server->flags & (SERV_LITERAL_ADDRESS | SERV_HAS_DOMAIN | SERV_FOR_NODOTS | SERV_NO_ADDR)) &&
634 sockaddr_isequal(&last_server->addr, &serveraddr))
636 server = last_server;
637 break;
640 if (!option_bool(OPT_ALL_SERVERS))
641 daemon->last_server = server;
644 /* If the answer is an error, keep the forward record in place in case
645 we get a good reply from another server. Kill it when we've
646 had replies from all to avoid filling the forwarding table when
647 everything is broken */
648 if (forward->forwardall == 0 || --forward->forwardall == 1 ||
649 (RCODE(header) != REFUSED && RCODE(header) != SERVFAIL))
651 int check_rebind = !(forward->flags & FREC_NOREBIND);
653 if (!option_bool(OPT_NO_REBIND))
654 check_rebind = 0;
656 if ((nn = process_reply(header, now, server, (size_t)n, check_rebind, forward->flags & FREC_CHECKING_DISABLED,
657 forward->flags & FREC_HAS_SUBNET, &forward->source)))
659 header->id = htons(forward->orig_id);
660 header->hb4 |= HB4_RA; /* recursion if available */
661 send_from(forward->fd, option_bool(OPT_NOWILD) || option_bool (OPT_CLEVERBIND), daemon->packet, nn,
662 &forward->source, &forward->dest, forward->iface);
664 free_frec(forward); /* cancel */
669 void receive_query(struct listener *listen, time_t now)
671 struct dns_header *header = (struct dns_header *)daemon->packet;
672 union mysockaddr source_addr;
673 unsigned short type;
674 struct all_addr dst_addr;
675 struct in_addr netmask, dst_addr_4;
676 size_t m;
677 ssize_t n;
678 int if_index = 0, auth_dns = 0;
679 #ifdef HAVE_AUTH
680 int local_auth = 0;
681 #endif
682 struct iovec iov[1];
683 struct msghdr msg;
684 struct cmsghdr *cmptr;
685 union {
686 struct cmsghdr align; /* this ensures alignment */
687 #ifdef HAVE_IPV6
688 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
689 #endif
690 #if defined(HAVE_LINUX_NETWORK)
691 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
692 #elif defined(IP_RECVDSTADDR) && defined(HAVE_SOLARIS_NETWORK)
693 char control[CMSG_SPACE(sizeof(struct in_addr)) +
694 CMSG_SPACE(sizeof(unsigned int))];
695 #elif defined(IP_RECVDSTADDR)
696 char control[CMSG_SPACE(sizeof(struct in_addr)) +
697 CMSG_SPACE(sizeof(struct sockaddr_dl))];
698 #endif
699 } control_u;
701 /* packet buffer overwritten */
702 daemon->srv_save = NULL;
704 dst_addr_4.s_addr = 0;
705 netmask.s_addr = 0;
707 if (option_bool(OPT_NOWILD) && listen->iface)
709 auth_dns = listen->iface->dns_auth;
711 if (listen->family == AF_INET)
713 dst_addr_4 = listen->iface->addr.in.sin_addr;
714 netmask = listen->iface->netmask;
718 iov[0].iov_base = daemon->packet;
719 iov[0].iov_len = daemon->edns_pktsz;
721 msg.msg_control = control_u.control;
722 msg.msg_controllen = sizeof(control_u);
723 msg.msg_flags = 0;
724 msg.msg_name = &source_addr;
725 msg.msg_namelen = sizeof(source_addr);
726 msg.msg_iov = iov;
727 msg.msg_iovlen = 1;
729 if ((n = recvmsg(listen->fd, &msg, 0)) == -1)
730 return;
732 if (n < (int)sizeof(struct dns_header) ||
733 (msg.msg_flags & MSG_TRUNC) ||
734 (header->hb3 & HB3_QR))
735 return;
737 source_addr.sa.sa_family = listen->family;
738 #ifdef HAVE_IPV6
739 if (listen->family == AF_INET6)
740 source_addr.in6.sin6_flowinfo = 0;
741 #endif
743 if (!option_bool(OPT_NOWILD))
745 struct ifreq ifr;
747 if (msg.msg_controllen < sizeof(struct cmsghdr))
748 return;
750 #if defined(HAVE_LINUX_NETWORK)
751 if (listen->family == AF_INET)
752 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
753 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_PKTINFO)
755 union {
756 unsigned char *c;
757 struct in_pktinfo *p;
758 } p;
759 p.c = CMSG_DATA(cmptr);
760 dst_addr_4 = dst_addr.addr.addr4 = p.p->ipi_spec_dst;
761 if_index = p.p->ipi_ifindex;
763 #elif defined(IP_RECVDSTADDR) && defined(IP_RECVIF)
764 if (listen->family == AF_INET)
766 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
768 union {
769 unsigned char *c;
770 unsigned int *i;
771 struct in_addr *a;
772 #ifndef HAVE_SOLARIS_NETWORK
773 struct sockaddr_dl *s;
774 #endif
775 } p;
776 p.c = CMSG_DATA(cmptr);
777 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVDSTADDR)
778 dst_addr_4 = dst_addr.addr.addr4 = *(p.a);
779 else if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVIF)
780 #ifdef HAVE_SOLARIS_NETWORK
781 if_index = *(p.i);
782 #else
783 if_index = p.s->sdl_index;
784 #endif
787 #endif
789 #ifdef HAVE_IPV6
790 if (listen->family == AF_INET6)
792 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
793 if (cmptr->cmsg_level == IPPROTO_IPV6 && cmptr->cmsg_type == daemon->v6pktinfo)
795 union {
796 unsigned char *c;
797 struct in6_pktinfo *p;
798 } p;
799 p.c = CMSG_DATA(cmptr);
801 dst_addr.addr.addr6 = p.p->ipi6_addr;
802 if_index = p.p->ipi6_ifindex;
805 #endif
807 /* enforce available interface configuration */
809 if (!indextoname(listen->fd, if_index, ifr.ifr_name))
810 return;
812 if (!iface_check(listen->family, &dst_addr, ifr.ifr_name, &auth_dns))
814 if (!option_bool(OPT_CLEVERBIND))
815 enumerate_interfaces(0);
816 if (!loopback_exception(listen->fd, listen->family, &dst_addr, ifr.ifr_name) &&
817 !label_exception(if_index, listen->family, &dst_addr))
818 return;
821 if (listen->family == AF_INET && option_bool(OPT_LOCALISE))
823 struct irec *iface;
825 /* get the netmask of the interface whch has the address we were sent to.
826 This is no neccessarily the interface we arrived on. */
828 for (iface = daemon->interfaces; iface; iface = iface->next)
829 if (iface->addr.sa.sa_family == AF_INET &&
830 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
831 break;
833 /* interface may be new */
834 if (!iface && !option_bool(OPT_CLEVERBIND))
835 enumerate_interfaces(0);
837 for (iface = daemon->interfaces; iface; iface = iface->next)
838 if (iface->addr.sa.sa_family == AF_INET &&
839 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
840 break;
842 /* If we failed, abandon localisation */
843 if (iface)
844 netmask = iface->netmask;
845 else
846 dst_addr_4.s_addr = 0;
850 if (extract_request(header, (size_t)n, daemon->namebuff, &type))
852 char types[20];
853 #ifdef HAVE_AUTH
854 struct auth_zone *zone;
855 #endif
857 querystr(auth_dns ? "auth" : "query", types, type);
859 if (listen->family == AF_INET)
860 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
861 (struct all_addr *)&source_addr.in.sin_addr, types);
862 #ifdef HAVE_IPV6
863 else
864 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
865 (struct all_addr *)&source_addr.in6.sin6_addr, types);
866 #endif
868 #ifdef HAVE_AUTH
869 /* find queries for zones we're authoritative for, and answer them directly */
870 if (!auth_dns)
871 for (zone = daemon->auth_zones; zone; zone = zone->next)
872 if (in_zone(zone, daemon->namebuff, NULL))
874 auth_dns = 1;
875 local_auth = 1;
876 break;
878 #endif
881 #ifdef HAVE_AUTH
882 if (auth_dns)
884 m = answer_auth(header, ((char *) header) + PACKETSZ, (size_t)n, now, &source_addr, local_auth);
885 if (m >= 1)
887 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
888 (char *)header, m, &source_addr, &dst_addr, if_index);
889 daemon->auth_answer++;
892 else
893 #endif
895 m = answer_request(header, ((char *) header) + PACKETSZ, (size_t)n,
896 dst_addr_4, netmask, now);
898 if (m >= 1)
900 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
901 (char *)header, m, &source_addr, &dst_addr, if_index);
902 daemon->local_answer++;
904 else if (forward_query(listen->fd, &source_addr, &dst_addr, if_index,
905 header, (size_t)n, now, NULL))
906 daemon->queries_forwarded++;
907 else
908 daemon->local_answer++;
912 /* The daemon forks before calling this: it should deal with one connection,
913 blocking as neccessary, and then return. Note, need to be a bit careful
914 about resources for debug mode, when the fork is suppressed: that's
915 done by the caller. */
916 unsigned char *tcp_request(int confd, time_t now,
917 union mysockaddr *local_addr, struct in_addr netmask, int auth_dns)
919 size_t size = 0;
920 int norebind = 0;
921 #ifdef HAVE_AUTH
922 int local_auth = 0;
923 #endif
924 int checking_disabled, check_subnet;
925 size_t m;
926 unsigned short qtype;
927 unsigned int gotname;
928 unsigned char c1, c2;
929 /* Max TCP packet + slop + size */
930 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
931 unsigned char *payload = &packet[2];
932 /* largest field in header is 16-bits, so this is still sufficiently aligned */
933 struct dns_header *header = (struct dns_header *)payload;
934 u16 *length = (u16 *)packet;
935 struct server *last_server;
936 struct in_addr dst_addr_4;
937 union mysockaddr peer_addr;
938 socklen_t peer_len = sizeof(union mysockaddr);
940 if (getpeername(confd, (struct sockaddr *)&peer_addr, &peer_len) == -1)
941 return packet;
943 while (1)
945 if (!packet ||
946 !read_write(confd, &c1, 1, 1) || !read_write(confd, &c2, 1, 1) ||
947 !(size = c1 << 8 | c2) ||
948 !read_write(confd, payload, size, 1))
949 return packet;
951 if (size < (int)sizeof(struct dns_header))
952 continue;
954 check_subnet = 0;
956 /* save state of "cd" flag in query */
957 checking_disabled = header->hb4 & HB4_CD;
959 /* RFC 4035: sect 4.6 para 2 */
960 header->hb4 &= ~HB4_AD;
962 if ((gotname = extract_request(header, (unsigned int)size, daemon->namebuff, &qtype)))
964 char types[20];
965 #ifdef HAVE_AUTH
966 struct auth_zone *zone;
967 #endif
968 querystr(auth_dns ? "auth" : "query", types, qtype);
970 if (peer_addr.sa.sa_family == AF_INET)
971 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
972 (struct all_addr *)&peer_addr.in.sin_addr, types);
973 #ifdef HAVE_IPV6
974 else
975 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
976 (struct all_addr *)&peer_addr.in6.sin6_addr, types);
977 #endif
979 #ifdef HAVE_AUTH
980 /* find queries for zones we're authoritative for, and answer them directly */
981 if (!auth_dns)
982 for (zone = daemon->auth_zones; zone; zone = zone->next)
983 if (in_zone(zone, daemon->namebuff, NULL))
985 auth_dns = 1;
986 local_auth = 1;
987 break;
989 #endif
992 if (local_addr->sa.sa_family == AF_INET)
993 dst_addr_4 = local_addr->in.sin_addr;
994 else
995 dst_addr_4.s_addr = 0;
997 #ifdef HAVE_AUTH
998 if (auth_dns)
999 m = answer_auth(header, ((char *) header) + 65536, (size_t)size, now, &peer_addr, local_auth);
1000 else
1001 #endif
1003 /* m > 0 if answered from cache */
1004 m = answer_request(header, ((char *) header) + 65536, (size_t)size,
1005 dst_addr_4, netmask, now);
1007 /* Do this by steam now we're not in the select() loop */
1008 check_log_writer(NULL);
1010 if (m == 0)
1012 unsigned int flags = 0;
1013 struct all_addr *addrp = NULL;
1014 int type = 0;
1015 char *domain = NULL;
1017 if (option_bool(OPT_ADD_MAC))
1018 size = add_mac(header, size, ((char *) header) + 65536, &peer_addr);
1020 if (option_bool(OPT_CLIENT_SUBNET))
1022 size_t new = add_source_addr(header, size, ((char *) header) + 65536, &peer_addr);
1023 if (size != new)
1025 size = new;
1026 check_subnet = 1;
1030 if (gotname)
1031 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
1033 if (type != 0 || option_bool(OPT_ORDER) || !daemon->last_server)
1034 last_server = daemon->servers;
1035 else
1036 last_server = daemon->last_server;
1038 if (!flags && last_server)
1040 struct server *firstsendto = NULL;
1041 unsigned int crc = questions_crc(header, (unsigned int)size, daemon->namebuff);
1043 /* Loop round available servers until we succeed in connecting to one.
1044 Note that this code subtley ensures that consecutive queries on this connection
1045 which can go to the same server, do so. */
1046 while (1)
1048 if (!firstsendto)
1049 firstsendto = last_server;
1050 else
1052 if (!(last_server = last_server->next))
1053 last_server = daemon->servers;
1055 if (last_server == firstsendto)
1056 break;
1059 /* server for wrong domain */
1060 if (type != (last_server->flags & SERV_TYPE) ||
1061 (type == SERV_HAS_DOMAIN && !hostname_isequal(domain, last_server->domain)))
1062 continue;
1064 if (last_server->tcpfd == -1)
1066 if ((last_server->tcpfd = socket(last_server->addr.sa.sa_family, SOCK_STREAM, 0)) == -1)
1067 continue;
1069 if ((!local_bind(last_server->tcpfd, &last_server->source_addr, last_server->interface, 1) ||
1070 connect(last_server->tcpfd, &last_server->addr.sa, sa_len(&last_server->addr)) == -1))
1072 close(last_server->tcpfd);
1073 last_server->tcpfd = -1;
1074 continue;
1077 #ifdef HAVE_CONNTRACK
1078 /* Copy connection mark of incoming query to outgoing connection. */
1079 if (option_bool(OPT_CONNTRACK))
1081 unsigned int mark;
1082 struct all_addr local;
1083 #ifdef HAVE_IPV6
1084 if (local_addr->sa.sa_family == AF_INET6)
1085 local.addr.addr6 = local_addr->in6.sin6_addr;
1086 else
1087 #endif
1088 local.addr.addr4 = local_addr->in.sin_addr;
1090 if (get_incoming_mark(&peer_addr, &local, 1, &mark))
1091 setsockopt(last_server->tcpfd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
1093 #endif
1096 *length = htons(size);
1098 if (!read_write(last_server->tcpfd, packet, size + sizeof(u16), 0) ||
1099 !read_write(last_server->tcpfd, &c1, 1, 1) ||
1100 !read_write(last_server->tcpfd, &c2, 1, 1))
1102 close(last_server->tcpfd);
1103 last_server->tcpfd = -1;
1104 continue;
1107 m = (c1 << 8) | c2;
1108 if (!read_write(last_server->tcpfd, payload, m, 1))
1109 return packet;
1111 if (!gotname)
1112 strcpy(daemon->namebuff, "query");
1113 if (last_server->addr.sa.sa_family == AF_INET)
1114 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1115 (struct all_addr *)&last_server->addr.in.sin_addr, NULL);
1116 #ifdef HAVE_IPV6
1117 else
1118 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1119 (struct all_addr *)&last_server->addr.in6.sin6_addr, NULL);
1120 #endif
1122 /* There's no point in updating the cache, since this process will exit and
1123 lose the information after a few queries. We make this call for the alias and
1124 bogus-nxdomain side-effects. */
1125 /* If the crc of the question section doesn't match the crc we sent, then
1126 someone might be attempting to insert bogus values into the cache by
1127 sending replies containing questions and bogus answers. */
1128 if (crc == questions_crc(header, (unsigned int)m, daemon->namebuff))
1129 m = process_reply(header, now, last_server, (unsigned int)m,
1130 option_bool(OPT_NO_REBIND) && !norebind, checking_disabled,
1131 check_subnet, &peer_addr);
1133 break;
1137 /* In case of local answer or no connections made. */
1138 if (m == 0)
1139 m = setup_reply(header, (unsigned int)size, addrp, flags, daemon->local_ttl);
1143 check_log_writer(NULL);
1145 *length = htons(m);
1147 if (m == 0 || !read_write(confd, packet, m + sizeof(u16), 0))
1148 return packet;
1152 static struct frec *allocate_frec(time_t now)
1154 struct frec *f;
1156 if ((f = (struct frec *)whine_malloc(sizeof(struct frec))))
1158 f->next = daemon->frec_list;
1159 f->time = now;
1160 f->sentto = NULL;
1161 f->rfd4 = NULL;
1162 f->flags = 0;
1163 #ifdef HAVE_IPV6
1164 f->rfd6 = NULL;
1165 #endif
1166 daemon->frec_list = f;
1169 return f;
1172 static struct randfd *allocate_rfd(int family)
1174 static int finger = 0;
1175 int i;
1177 /* limit the number of sockets we have open to avoid starvation of
1178 (eg) TFTP. Once we have a reasonable number, randomness should be OK */
1180 for (i = 0; i < RANDOM_SOCKS; i++)
1181 if (daemon->randomsocks[i].refcount == 0)
1183 if ((daemon->randomsocks[i].fd = random_sock(family)) == -1)
1184 break;
1186 daemon->randomsocks[i].refcount = 1;
1187 daemon->randomsocks[i].family = family;
1188 return &daemon->randomsocks[i];
1191 /* No free ones or cannot get new socket, grab an existing one */
1192 for (i = 0; i < RANDOM_SOCKS; i++)
1194 int j = (i+finger) % RANDOM_SOCKS;
1195 if (daemon->randomsocks[j].refcount != 0 &&
1196 daemon->randomsocks[j].family == family &&
1197 daemon->randomsocks[j].refcount != 0xffff)
1199 finger = j;
1200 daemon->randomsocks[j].refcount++;
1201 return &daemon->randomsocks[j];
1205 return NULL; /* doom */
1208 static void free_frec(struct frec *f)
1210 if (f->rfd4 && --(f->rfd4->refcount) == 0)
1211 close(f->rfd4->fd);
1213 f->rfd4 = NULL;
1214 f->sentto = NULL;
1215 f->flags = 0;
1217 #ifdef HAVE_IPV6
1218 if (f->rfd6 && --(f->rfd6->refcount) == 0)
1219 close(f->rfd6->fd);
1221 f->rfd6 = NULL;
1222 #endif
1225 /* if wait==NULL return a free or older than TIMEOUT record.
1226 else return *wait zero if one available, or *wait is delay to
1227 when the oldest in-use record will expire. Impose an absolute
1228 limit of 4*TIMEOUT before we wipe things (for random sockets) */
1229 struct frec *get_new_frec(time_t now, int *wait)
1231 struct frec *f, *oldest, *target;
1232 int count;
1234 if (wait)
1235 *wait = 0;
1237 for (f = daemon->frec_list, oldest = NULL, target = NULL, count = 0; f; f = f->next, count++)
1238 if (!f->sentto)
1239 target = f;
1240 else
1242 if (difftime(now, f->time) >= 4*TIMEOUT)
1244 free_frec(f);
1245 target = f;
1248 if (!oldest || difftime(f->time, oldest->time) <= 0)
1249 oldest = f;
1252 if (target)
1254 target->time = now;
1255 return target;
1258 /* can't find empty one, use oldest if there is one
1259 and it's older than timeout */
1260 if (oldest && ((int)difftime(now, oldest->time)) >= TIMEOUT)
1262 /* keep stuff for twice timeout if we can by allocating a new
1263 record instead */
1264 if (difftime(now, oldest->time) < 2*TIMEOUT &&
1265 count <= daemon->ftabsize &&
1266 (f = allocate_frec(now)))
1267 return f;
1269 if (!wait)
1271 free_frec(oldest);
1272 oldest->time = now;
1274 return oldest;
1277 /* none available, calculate time 'till oldest record expires */
1278 if (count > daemon->ftabsize)
1280 static time_t last_log = 0;
1282 if (oldest && wait)
1283 *wait = oldest->time + (time_t)TIMEOUT - now;
1285 if ((int)difftime(now, last_log) > 5)
1287 last_log = now;
1288 my_syslog(LOG_WARNING, _("Maximum number of concurrent DNS queries reached (max: %d)"), daemon->ftabsize);
1291 return NULL;
1294 if (!(f = allocate_frec(now)) && wait)
1295 /* wait one second on malloc failure */
1296 *wait = 1;
1298 return f; /* OK if malloc fails and this is NULL */
1301 /* crc is all-ones if not known. */
1302 static struct frec *lookup_frec(unsigned short id, unsigned int crc)
1304 struct frec *f;
1306 for(f = daemon->frec_list; f; f = f->next)
1307 if (f->sentto && f->new_id == id &&
1308 (f->crc == crc || crc == 0xffffffff))
1309 return f;
1311 return NULL;
1314 static struct frec *lookup_frec_by_sender(unsigned short id,
1315 union mysockaddr *addr,
1316 unsigned int crc)
1318 struct frec *f;
1320 for(f = daemon->frec_list; f; f = f->next)
1321 if (f->sentto &&
1322 f->orig_id == id &&
1323 f->crc == crc &&
1324 sockaddr_isequal(&f->source, addr))
1325 return f;
1327 return NULL;
1330 /* A server record is going away, remove references to it */
1331 void server_gone(struct server *server)
1333 struct frec *f;
1335 for (f = daemon->frec_list; f; f = f->next)
1336 if (f->sentto && f->sentto == server)
1337 free_frec(f);
1339 if (daemon->last_server == server)
1340 daemon->last_server = NULL;
1342 if (daemon->srv_save == server)
1343 daemon->srv_save = NULL;
/* Return a random 16-bit id for which lookup_frec() finds no in-use
   record with the given crc. Keeps drawing from rand16() until one is
   found. */
static unsigned short get_id(unsigned int crc)
{
  unsigned short candidate;

  for (;;)
    {
      candidate = rand16();
      if (!lookup_frec(candidate, crc))
        return candidate;
    }
}