/* Source: git.ipfire.org Git - people/ms/dnsmasq.git / blob - src/forward.c
   Update copyright for 2014.
   [people/ms/dnsmasq.git] / src / forward.c */
1 /* dnsmasq is Copyright (c) 2000-2014 Simon Kelley
2
3 This program is free software; you can redistribute it and/or modify
4 it under the terms of the GNU General Public License as published by
5 the Free Software Foundation; version 2 dated June, 1991, or
6 (at your option) version 3 dated 29 June, 2007.
7
8 This program is distributed in the hope that it will be useful,
9 but WITHOUT ANY WARRANTY; without even the implied warranty of
10 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 GNU General Public License for more details.
12
13 You should have received a copy of the GNU General Public License
14 along with this program. If not, see <http://www.gnu.org/licenses/>.
15 */
16
17 #include "dnsmasq.h"
18
19 static struct frec *lookup_frec(unsigned short id, unsigned int crc);
20 static struct frec *lookup_frec_by_sender(unsigned short id,
21 union mysockaddr *addr,
22 unsigned int crc);
23 static unsigned short get_id(unsigned int crc);
24 static void free_frec(struct frec *f);
25 static struct randfd *allocate_rfd(int family);
26
27 /* Send a UDP packet with its source address set as "source"
28 unless nowild is true, when we just send it with the kernel default */
29 int send_from(int fd, int nowild, char *packet, size_t len,
30 union mysockaddr *to, struct all_addr *source,
31 unsigned int iface)
32 {
33 struct msghdr msg;
34 struct iovec iov[1];
35 union {
36 struct cmsghdr align; /* this ensures alignment */
37 #if defined(HAVE_LINUX_NETWORK)
38 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
39 #elif defined(IP_SENDSRCADDR)
40 char control[CMSG_SPACE(sizeof(struct in_addr))];
41 #endif
42 #ifdef HAVE_IPV6
43 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
44 #endif
45 } control_u;
46
47 iov[0].iov_base = packet;
48 iov[0].iov_len = len;
49
50 msg.msg_control = NULL;
51 msg.msg_controllen = 0;
52 msg.msg_flags = 0;
53 msg.msg_name = to;
54 msg.msg_namelen = sa_len(to);
55 msg.msg_iov = iov;
56 msg.msg_iovlen = 1;
57
58 if (!nowild)
59 {
60 struct cmsghdr *cmptr;
61 msg.msg_control = &control_u;
62 msg.msg_controllen = sizeof(control_u);
63 cmptr = CMSG_FIRSTHDR(&msg);
64
65 if (to->sa.sa_family == AF_INET)
66 {
67 #if defined(HAVE_LINUX_NETWORK)
68 struct in_pktinfo p;
69 p.ipi_ifindex = 0;
70 p.ipi_spec_dst = source->addr.addr4;
71 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
72 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_pktinfo));
73 cmptr->cmsg_level = IPPROTO_IP;
74 cmptr->cmsg_type = IP_PKTINFO;
75 #elif defined(IP_SENDSRCADDR)
76 memcpy(CMSG_DATA(cmptr), &(source->addr.addr4), sizeof(source->addr.addr4));
77 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_addr));
78 cmptr->cmsg_level = IPPROTO_IP;
79 cmptr->cmsg_type = IP_SENDSRCADDR;
80 #endif
81 }
82 else
83 #ifdef HAVE_IPV6
84 {
85 struct in6_pktinfo p;
86 p.ipi6_ifindex = iface; /* Need iface for IPv6 to handle link-local addrs */
87 p.ipi6_addr = source->addr.addr6;
88 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
89 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
90 cmptr->cmsg_type = daemon->v6pktinfo;
91 cmptr->cmsg_level = IPPROTO_IPV6;
92 }
93 #else
94 (void)iface; /* eliminate warning */
95 #endif
96 }
97
98 while (sendmsg(fd, &msg, 0) == -1)
99 {
100 if (retry_send())
101 continue;
102
103 /* If interface is still in DAD, EINVAL results - ignore that. */
104 if (errno == EINVAL)
105 break;
106
107 my_syslog(LOG_ERR, _("failed to send packet: %s"), strerror(errno));
108 return 0;
109 }
110
111 return 1;
112 }
113
114 static unsigned int search_servers(time_t now, struct all_addr **addrpp,
115 unsigned int qtype, char *qdomain, int *type, char **domain, int *norebind)
116
117 {
118 /* If the query ends in the domain in one of our servers, set
119 domain to point to that name. We find the largest match to allow both
120 domain.org and sub.domain.org to exist. */
121
122 unsigned int namelen = strlen(qdomain);
123 unsigned int matchlen = 0;
124 struct server *serv;
125 unsigned int flags = 0;
126
127 for (serv = daemon->servers; serv; serv=serv->next)
128 /* domain matches take priority over NODOTS matches */
129 if ((serv->flags & SERV_FOR_NODOTS) && *type != SERV_HAS_DOMAIN && !strchr(qdomain, '.') && namelen != 0)
130 {
131 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
132 *type = SERV_FOR_NODOTS;
133 if (serv->flags & SERV_NO_ADDR)
134 flags = F_NXDOMAIN;
135 else if (serv->flags & SERV_LITERAL_ADDRESS)
136 {
137 if (sflag & qtype)
138 {
139 flags = sflag;
140 if (serv->addr.sa.sa_family == AF_INET)
141 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
142 #ifdef HAVE_IPV6
143 else
144 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
145 #endif
146 }
147 else if (!flags || (flags & F_NXDOMAIN))
148 flags = F_NOERR;
149 }
150 }
151 else if (serv->flags & SERV_HAS_DOMAIN)
152 {
153 unsigned int domainlen = strlen(serv->domain);
154 char *matchstart = qdomain + namelen - domainlen;
155 if (namelen >= domainlen &&
156 hostname_isequal(matchstart, serv->domain) &&
157 (domainlen == 0 || namelen == domainlen || *(matchstart-1) == '.' ))
158 {
159 if (serv->flags & SERV_NO_REBIND)
160 *norebind = 1;
161 else
162 {
163 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
164 /* implement priority rules for --address and --server for same domain.
165 --address wins if the address is for the correct AF
166 --server wins otherwise. */
167 if (domainlen != 0 && domainlen == matchlen)
168 {
169 if ((serv->flags & SERV_LITERAL_ADDRESS))
170 {
171 if (!(sflag & qtype) && flags == 0)
172 continue;
173 }
174 else
175 {
176 if (flags & (F_IPV4 | F_IPV6))
177 continue;
178 }
179 }
180
181 if (domainlen >= matchlen)
182 {
183 *type = serv->flags & (SERV_HAS_DOMAIN | SERV_USE_RESOLV | SERV_NO_REBIND);
184 *domain = serv->domain;
185 matchlen = domainlen;
186 if (serv->flags & SERV_NO_ADDR)
187 flags = F_NXDOMAIN;
188 else if (serv->flags & SERV_LITERAL_ADDRESS)
189 {
190 if (sflag & qtype)
191 {
192 flags = sflag;
193 if (serv->addr.sa.sa_family == AF_INET)
194 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
195 #ifdef HAVE_IPV6
196 else
197 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
198 #endif
199 }
200 else if (!flags || (flags & F_NXDOMAIN))
201 flags = F_NOERR;
202 }
203 else
204 flags = 0;
205 }
206 }
207 }
208 }
209
210 if (flags == 0 && !(qtype & F_QUERY) &&
211 option_bool(OPT_NODOTS_LOCAL) && !strchr(qdomain, '.') && namelen != 0)
212 /* don't forward A or AAAA queries for simple names, except the empty name */
213 flags = F_NOERR;
214
215 if (flags == F_NXDOMAIN && check_for_local_domain(qdomain, now))
216 flags = F_NOERR;
217
218 if (flags)
219 {
220 int logflags = 0;
221
222 if (flags == F_NXDOMAIN || flags == F_NOERR)
223 logflags = F_NEG | qtype;
224
225 log_query(logflags | flags | F_CONFIG | F_FORWARD, qdomain, *addrpp, NULL);
226 }
227 else if ((*type) & SERV_USE_RESOLV)
228 {
229 *type = 0; /* use normal servers for this domain */
230 *domain = NULL;
231 }
232 return flags;
233 }
234
235 static int forward_query(int udpfd, union mysockaddr *udpaddr,
236 struct all_addr *dst_addr, unsigned int dst_iface,
237 struct dns_header *header, size_t plen, time_t now, struct frec *forward)
238 {
239 char *domain = NULL;
240 int type = 0, norebind = 0;
241 struct all_addr *addrp = NULL;
242 unsigned int crc = questions_crc(header, plen, daemon->namebuff);
243 unsigned int flags = 0;
244 unsigned int gotname = extract_request(header, plen, daemon->namebuff, NULL);
245 struct server *start = NULL;
246
247 /* RFC 4035: sect 4.6 para 2 */
248 header->hb4 &= ~HB4_AD;
249
250 /* may be no servers available. */
251 if (!daemon->servers)
252 forward = NULL;
253 else if (forward || (forward = lookup_frec_by_sender(ntohs(header->id), udpaddr, crc)))
254 {
255 /* retry on existing query, send to all available servers */
256 domain = forward->sentto->domain;
257 forward->sentto->failed_queries++;
258 if (!option_bool(OPT_ORDER))
259 {
260 forward->forwardall = 1;
261 daemon->last_server = NULL;
262 }
263 type = forward->sentto->flags & SERV_TYPE;
264 if (!(start = forward->sentto->next))
265 start = daemon->servers; /* at end of list, recycle */
266 header->id = htons(forward->new_id);
267 }
268 else
269 {
270 if (gotname)
271 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
272
273 if (!flags && !(forward = get_new_frec(now, NULL, 0)))
274 /* table full - server failure. */
275 flags = F_NEG;
276
277 if (forward)
278 {
279 forward->source = *udpaddr;
280 forward->dest = *dst_addr;
281 forward->iface = dst_iface;
282 forward->orig_id = ntohs(header->id);
283 forward->new_id = get_id(crc);
284 forward->fd = udpfd;
285 forward->crc = crc;
286 forward->forwardall = 0;
287 forward->flags = 0;
288 if (norebind)
289 forward->flags |= FREC_NOREBIND;
290 if (header->hb4 & HB4_CD)
291 forward->flags |= FREC_CHECKING_DISABLED;
292
293 header->id = htons(forward->new_id);
294
295 /* In strict_order mode, always try servers in the order
296 specified in resolv.conf, if a domain is given
297 always try all the available servers,
298 otherwise, use the one last known to work. */
299
300 if (type == 0)
301 {
302 if (option_bool(OPT_ORDER))
303 start = daemon->servers;
304 else if (!(start = daemon->last_server) ||
305 daemon->forwardcount++ > FORWARD_TEST ||
306 difftime(now, daemon->forwardtime) > FORWARD_TIME)
307 {
308 start = daemon->servers;
309 forward->forwardall = 1;
310 daemon->forwardcount = 0;
311 daemon->forwardtime = now;
312 }
313 }
314 else
315 {
316 start = daemon->servers;
317 if (!option_bool(OPT_ORDER))
318 forward->forwardall = 1;
319 }
320 }
321 }
322
323 /* check for send errors here (no route to host)
324 if we fail to send to all nameservers, send back an error
325 packet straight away (helps modem users when offline) */
326
327 if (!flags && forward)
328 {
329 struct server *firstsentto = start;
330 int forwarded = 0;
331
332 if (option_bool(OPT_ADD_MAC))
333 plen = add_mac(header, plen, ((char *) header) + daemon->packet_buff_sz, &forward->source);
334
335 if (option_bool(OPT_CLIENT_SUBNET))
336 {
337 size_t new = add_source_addr(header, plen, ((char *) header) + daemon->packet_buff_sz, &forward->source);
338 if (new != plen)
339 {
340 plen = new;
341 forward->flags |= FREC_HAS_SUBNET;
342 }
343 }
344
345 #ifdef HAVE_DNSSEC
346 if (option_bool(OPT_DNSSEC_VALID))
347 {
348 plen = add_do_bit(header, plen, ((char *) header) + daemon->packet_buff_sz);
349 header->hb4 |= HB4_CD;
350 }
351 #endif
352
353 while (1)
354 {
355 /* only send to servers dealing with our domain.
356 domain may be NULL, in which case server->domain
357 must be NULL also. */
358
359 if (type == (start->flags & SERV_TYPE) &&
360 (type != SERV_HAS_DOMAIN || hostname_isequal(domain, start->domain)) &&
361 !(start->flags & SERV_LITERAL_ADDRESS))
362 {
363 int fd;
364
365 /* find server socket to use, may need to get random one. */
366 if (start->sfd)
367 fd = start->sfd->fd;
368 else
369 {
370 #ifdef HAVE_IPV6
371 if (start->addr.sa.sa_family == AF_INET6)
372 {
373 if (!forward->rfd6 &&
374 !(forward->rfd6 = allocate_rfd(AF_INET6)))
375 break;
376 daemon->rfd_save = forward->rfd6;
377 fd = forward->rfd6->fd;
378 }
379 else
380 #endif
381 {
382 if (!forward->rfd4 &&
383 !(forward->rfd4 = allocate_rfd(AF_INET)))
384 break;
385 daemon->rfd_save = forward->rfd4;
386 fd = forward->rfd4->fd;
387 }
388
389 #ifdef HAVE_CONNTRACK
390 /* Copy connection mark of incoming query to outgoing connection. */
391 if (option_bool(OPT_CONNTRACK))
392 {
393 unsigned int mark;
394 if (get_incoming_mark(&forward->source, &forward->dest, 0, &mark))
395 setsockopt(fd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
396 }
397 #endif
398 }
399
400 if (sendto(fd, (char *)header, plen, 0,
401 &start->addr.sa,
402 sa_len(&start->addr)) == -1)
403 {
404 if (retry_send())
405 continue;
406 }
407 else
408 {
409 /* Keep info in case we want to re-send this packet */
410 daemon->srv_save = start;
411 daemon->packet_len = plen;
412
413 if (!gotname)
414 strcpy(daemon->namebuff, "query");
415 if (start->addr.sa.sa_family == AF_INET)
416 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
417 (struct all_addr *)&start->addr.in.sin_addr, NULL);
418 #ifdef HAVE_IPV6
419 else
420 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
421 (struct all_addr *)&start->addr.in6.sin6_addr, NULL);
422 #endif
423 start->queries++;
424 forwarded = 1;
425 forward->sentto = start;
426 if (!forward->forwardall)
427 break;
428 forward->forwardall++;
429 }
430 }
431
432 if (!(start = start->next))
433 start = daemon->servers;
434
435 if (start == firstsentto)
436 break;
437 }
438
439 if (forwarded)
440 return 1;
441
442 /* could not send on, prepare to return */
443 header->id = htons(forward->orig_id);
444 free_frec(forward); /* cancel */
445 }
446
447 /* could not send on, return empty answer or address if known for whole domain */
448 if (udpfd != -1)
449 {
450 plen = setup_reply(header, plen, addrp, flags, daemon->local_ttl);
451 send_from(udpfd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND), (char *)header, plen, udpaddr, dst_addr, dst_iface);
452 }
453
454 return 0;
455 }
456
457 static size_t process_reply(struct dns_header *header, time_t now, struct server *server, size_t n, int check_rebind,
458 int no_cache, int cache_secure, int check_subnet, union mysockaddr *query_source)
459 {
460 unsigned char *pheader, *sizep;
461 char **sets = 0;
462 int munged = 0, is_sign;
463 size_t plen;
464 int squash_ad = 0;
465
466 #ifdef HAVE_IPSET
467 /* Similar algorithm to search_servers. */
468 struct ipsets *ipset_pos;
469 unsigned int namelen = strlen(daemon->namebuff);
470 unsigned int matchlen = 0;
471 for (ipset_pos = daemon->ipsets; ipset_pos; ipset_pos = ipset_pos->next)
472 {
473 unsigned int domainlen = strlen(ipset_pos->domain);
474 char *matchstart = daemon->namebuff + namelen - domainlen;
475 if (namelen >= domainlen && hostname_isequal(matchstart, ipset_pos->domain) &&
476 (domainlen == 0 || namelen == domainlen || *(matchstart - 1) == '.' ) &&
477 domainlen >= matchlen) {
478 matchlen = domainlen;
479 sets = ipset_pos->sets;
480 }
481 }
482 #endif
483
484 /* If upstream is advertising a larger UDP packet size
485 than we allow, trim it so that we don't get overlarge
486 requests for the client. We can't do this for signed packets. */
487
488 if ((pheader = find_pseudoheader(header, n, &plen, &sizep, &is_sign)))
489 {
490 if (!is_sign)
491 {
492 unsigned short udpsz;
493 unsigned char *psave = sizep;
494
495 GETSHORT(udpsz, sizep);
496 if (udpsz > daemon->edns_pktsz)
497 PUTSHORT(daemon->edns_pktsz, psave);
498 }
499
500 if (check_subnet && !check_source(header, plen, pheader, query_source))
501 {
502 my_syslog(LOG_WARNING, _("discarding DNS reply: subnet option mismatch"));
503 return 0;
504 }
505 }
506
507 /* RFC 4035 sect 4.6 para 3 */
508 if (!is_sign && !option_bool(OPT_DNSSEC_PROXY))
509 squash_ad = 1;
510
511 #ifdef HAVE_DNSSEC
512 if (option_bool(OPT_DNSSEC_VALID))
513 squash_ad = no_cache;
514
515 if (cache_secure)
516 header->hb4 |= HB4_AD;
517 #endif
518
519 if (squash_ad)
520 header->hb4 &= ~HB4_AD;
521
522 if (OPCODE(header) != QUERY || (RCODE(header) != NOERROR && RCODE(header) != NXDOMAIN))
523 return n;
524
525 /* Complain loudly if the upstream server is non-recursive. */
526 if (!(header->hb4 & HB4_RA) && RCODE(header) == NOERROR && ntohs(header->ancount) == 0 &&
527 server && !(server->flags & SERV_WARNED_RECURSIVE))
528 {
529 prettyprint_addr(&server->addr, daemon->namebuff);
530 my_syslog(LOG_WARNING, _("nameserver %s refused to do a recursive query"), daemon->namebuff);
531 if (!option_bool(OPT_LOG))
532 server->flags |= SERV_WARNED_RECURSIVE;
533 }
534
535 if (daemon->bogus_addr && RCODE(header) != NXDOMAIN &&
536 check_for_bogus_wildcard(header, n, daemon->namebuff, daemon->bogus_addr, now))
537 {
538 munged = 1;
539 SET_RCODE(header, NXDOMAIN);
540 header->hb3 &= ~HB3_AA;
541 }
542 else
543 {
544 if (RCODE(header) == NXDOMAIN &&
545 extract_request(header, n, daemon->namebuff, NULL) &&
546 check_for_local_domain(daemon->namebuff, now))
547 {
548 /* if we forwarded a query for a locally known name (because it was for
549 an unknown type) and the answer is NXDOMAIN, convert that to NODATA,
550 since we know that the domain exists, even if upstream doesn't */
551 munged = 1;
552 header->hb3 |= HB3_AA;
553 SET_RCODE(header, NOERROR);
554 }
555
556 if (extract_addresses(header, n, daemon->namebuff, now, sets, is_sign, check_rebind, no_cache, cache_secure))
557 {
558 my_syslog(LOG_WARNING, _("possible DNS-rebind attack detected: %s"), daemon->namebuff);
559 munged = 1;
560 }
561 }
562
563 /* do this after extract_addresses. Ensure NODATA reply and remove
564 nameserver info. */
565
566 if (munged)
567 {
568 header->ancount = htons(0);
569 header->nscount = htons(0);
570 header->arcount = htons(0);
571 }
572
573 /* the bogus-nxdomain stuff, doctor and NXDOMAIN->NODATA munging can all elide
574 sections of the packet. Find the new length here and put back pseudoheader
575 if it was removed. */
576 return resize_packet(header, n, pheader, plen);
577 }
578
579 /* sets new last_server */
580 void reply_query(int fd, int family, time_t now)
581 {
582 /* packet from peer server, extract data for cache, and send to
583 original requester */
584 struct dns_header *header;
585 union mysockaddr serveraddr;
586 struct frec *forward;
587 socklen_t addrlen = sizeof(serveraddr);
588 ssize_t n = recvfrom(fd, daemon->packet, daemon->packet_buff_sz, 0, &serveraddr.sa, &addrlen);
589 size_t nn;
590 struct server *server;
591
592 /* packet buffer overwritten */
593 daemon->srv_save = NULL;
594
595 /* Determine the address of the server replying so that we can mark that as good */
596 serveraddr.sa.sa_family = family;
597 #ifdef HAVE_IPV6
598 if (serveraddr.sa.sa_family == AF_INET6)
599 serveraddr.in6.sin6_flowinfo = 0;
600 #endif
601
602 /* spoof check: answer must come from known server, */
603 for (server = daemon->servers; server; server = server->next)
604 if (!(server->flags & (SERV_LITERAL_ADDRESS | SERV_NO_ADDR)) &&
605 sockaddr_isequal(&server->addr, &serveraddr))
606 break;
607
608 header = (struct dns_header *)daemon->packet;
609
610 if (!server ||
611 n < (int)sizeof(struct dns_header) || !(header->hb3 & HB3_QR) ||
612 !(forward = lookup_frec(ntohs(header->id), questions_crc(header, n, daemon->namebuff))))
613 return;
614
615 if ((RCODE(header) == SERVFAIL || RCODE(header) == REFUSED) &&
616 !option_bool(OPT_ORDER) &&
617 forward->forwardall == 0)
618 /* for broken servers, attempt to send to another one. */
619 {
620 unsigned char *pheader;
621 size_t plen;
622 int is_sign;
623
624 /* recreate query from reply */
625 pheader = find_pseudoheader(header, (size_t)n, &plen, NULL, &is_sign);
626 if (!is_sign)
627 {
628 header->ancount = htons(0);
629 header->nscount = htons(0);
630 header->arcount = htons(0);
631 if ((nn = resize_packet(header, (size_t)n, pheader, plen)))
632 {
633 header->hb3 &= ~(HB3_QR | HB3_TC);
634 forward_query(-1, NULL, NULL, 0, header, nn, now, forward);
635 return;
636 }
637 }
638 }
639
640 server = forward->sentto;
641
642 if ((forward->sentto->flags & SERV_TYPE) == 0)
643 {
644 if (RCODE(header) == SERVFAIL || RCODE(header) == REFUSED)
645 server = NULL;
646 else
647 {
648 struct server *last_server;
649
650 /* find good server by address if possible, otherwise assume the last one we sent to */
651 for (last_server = daemon->servers; last_server; last_server = last_server->next)
652 if (!(last_server->flags & (SERV_LITERAL_ADDRESS | SERV_HAS_DOMAIN | SERV_FOR_NODOTS | SERV_NO_ADDR)) &&
653 sockaddr_isequal(&last_server->addr, &serveraddr))
654 {
655 server = last_server;
656 break;
657 }
658 }
659 if (!option_bool(OPT_ALL_SERVERS))
660 daemon->last_server = server;
661 }
662
663 /* If the answer is an error, keep the forward record in place in case
664 we get a good reply from another server. Kill it when we've
665 had replies from all to avoid filling the forwarding table when
666 everything is broken */
667 if (forward->forwardall == 0 || --forward->forwardall == 1 ||
668 (RCODE(header) != REFUSED && RCODE(header) != SERVFAIL))
669 {
670 int check_rebind = 0, no_cache_dnssec = 0, cache_secure = 0;
671
672 if (option_bool(OPT_NO_REBIND))
673 check_rebind = !(forward->flags & FREC_NOREBIND);
674
675 /* Don't cache replies where DNSSEC validation was turned off, either
676 the upstream server told us so, or the original query specified it. */
677 if ((header->hb4 & HB4_CD) || (forward->flags & FREC_CHECKING_DISABLED))
678 no_cache_dnssec = 1;
679
680 #ifdef HAVE_DNSSEC
681 if (option_bool(OPT_DNSSEC_VALID) && !(forward->flags & FREC_CHECKING_DISABLED))
682 {
683 int status;
684
685 /* We've had a reply already, which we're validating. Ignore this duplicate */
686 if (forward->stash)
687 return;
688
689 if (header->hb3 & HB3_TC)
690 {
691 /* Truncated answer can't be validated.
692 The client will retry over TCP, but if this is an answer to a
693 DNSSEC-generated query, we have a problem. Should really re-send
694 over TCP. No-one with any sense will make a DNSKEY or DS RRset
695 exceed 4096, so this may not be a real problem. Just log
696 for now. */
697 if (forward->flags & (FREC_DNSKEY_QUERY | FREC_DS_QUERY))
698 my_syslog(LOG_ERR, _("Reply to DNSSEC query truncated - validation fails."));
699 status = STAT_INSECURE;
700 }
701 else if (forward->flags & FREC_DNSKEY_QUERY)
702 status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
703 else if (forward->flags & FREC_DS_QUERY)
704 status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
705 else
706 status = dnssec_validate_reply(now, header, n, daemon->namebuff, daemon->keyname, &forward->class);
707
708 /* Can't validate, as we're missing key data. Put this
709 answer aside, whilst we get that. */
710 if (status == STAT_NEED_DS || status == STAT_NEED_KEY)
711 {
712 struct frec *new;
713
714 if ((new = get_new_frec(now, NULL, 1)))
715 {
716 struct frec *next = new->next;
717 *new = *forward; /* copy everything, then overwrite */
718 new->next = next;
719 new->stash = NULL;
720 new->blocking_query = NULL;
721 new->rfd4 = NULL;
722 #ifdef HAVE_IPV6
723 new->rfd6 = NULL;
724 #endif
725 new->flags &= ~(FREC_DNSKEY_QUERY | FREC_DS_QUERY);
726
727 if ((forward->stash = blockdata_alloc((char *)header, n)))
728 {
729 int fd;
730
731 forward->stash_len = n;
732
733 new->dependent = forward; /* to find query awaiting new one. */
734 forward->blocking_query = new; /* for garbage cleaning */
735 /* validate routines leave name of required record in daemon->keyname */
736 if (status == STAT_NEED_KEY)
737 {
738 new->flags |= FREC_DNSKEY_QUERY;
739 nn = dnssec_generate_query(header, ((char *) header) + daemon->packet_buff_sz,
740 daemon->keyname, forward->class, T_DNSKEY, &server->addr);
741 }
742 else if (status == STAT_NEED_DS)
743 {
744 new->flags |= FREC_DS_QUERY;
745 nn = dnssec_generate_query(header,((char *) header) + daemon->packet_buff_sz,
746 daemon->keyname, forward->class, T_DS, &server->addr);
747 }
748 new->crc = questions_crc(header, nn, daemon->namebuff);
749 new->new_id = get_id(new->crc);
750 header->id = htons(new->new_id);
751
752 /* Don't resend this. */
753 daemon->srv_save = NULL;
754
755 if (server->sfd)
756 fd = server->sfd->fd;
757 else
758 {
759 fd = -1;
760 #ifdef HAVE_IPV6
761 if (server->addr.sa.sa_family == AF_INET6)
762 {
763 if (new->rfd6 || (new->rfd6 = allocate_rfd(AF_INET6)))
764 fd = new->rfd6->fd;
765 }
766 else
767 #endif
768 {
769 if (new->rfd4 || (new->rfd4 = allocate_rfd(AF_INET)))
770 fd = new->rfd4->fd;
771 }
772 }
773
774 if (fd != -1)
775 {
776 while (sendto(fd, (char *)header, nn, 0, &server->addr.sa, sa_len(&server->addr)) == -1 && retry_send());
777 server->queries++;
778 }
779 }
780 }
781
782 return;
783 }
784
785 /* Ok, we reached far enough up the chain-of-trust that we can validate something.
786 Now wind back down, pulling back answers which wouldn't previously validate
787 and validate them with the new data. Failure to find needed data here is an internal error.
788 Once we get to the original answer (FREC_DNSSEC_QUERY not set) and it validates,
789 return it to the original requestor. */
790 if (forward->flags & (FREC_DNSKEY_QUERY | FREC_DS_QUERY))
791 {
792 while (forward->dependent)
793 {
794 struct frec *prev;
795
796 if (status == STAT_SECURE)
797 {
798 if (forward->flags & FREC_DNSKEY_QUERY)
799 status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
800 else if (forward->flags & FREC_DS_QUERY)
801 status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
802 }
803
804 prev = forward->dependent;
805 free_frec(forward);
806 forward = prev;
807 forward->blocking_query = NULL; /* already gone */
808 blockdata_retrieve(forward->stash, forward->stash_len, (void *)header);
809 n = forward->stash_len;
810 }
811
812 /* All DNSKEY and DS records done and in cache, now finally validate original
813 answer, provided last DNSKEY is OK. */
814 if (status == STAT_SECURE)
815 status = dnssec_validate_reply(now, header, n, daemon->namebuff, daemon->keyname, &forward->class);
816
817 if (status == STAT_NEED_DS || status == STAT_NEED_KEY)
818 {
819 my_syslog(LOG_ERR, _("Unexpected missing data for DNSSEC validation"));
820 status = STAT_INSECURE;
821 }
822 }
823
824 log_query(F_KEYTAG | F_SECSTAT, "result", NULL,
825 status == STAT_SECURE ? "SECURE" : (status == STAT_INSECURE ? "INSECURE" : "BOGUS"));
826
827 no_cache_dnssec = 0;
828
829 if (status == STAT_SECURE)
830 cache_secure = 1;
831 /* TODO return SERVFAIL here */
832 else if (status == STAT_BOGUS)
833 no_cache_dnssec = 1;
834
835 /* restore CD bit to the value in the query */
836 if (forward->flags & FREC_CHECKING_DISABLED)
837 header->hb4 |= HB4_CD;
838 else
839 header->hb4 &= ~HB4_CD;
840 }
841 #endif
842
843 if ((nn = process_reply(header, now, server, (size_t)n, check_rebind, no_cache_dnssec, cache_secure,
844 forward->flags & FREC_HAS_SUBNET, &forward->source)))
845 {
846 header->id = htons(forward->orig_id);
847 header->hb4 |= HB4_RA; /* recursion if available */
848 send_from(forward->fd, option_bool(OPT_NOWILD) || option_bool (OPT_CLEVERBIND), daemon->packet, nn,
849 &forward->source, &forward->dest, forward->iface);
850 }
851 free_frec(forward); /* cancel */
852 }
853 }
854
855
856 void receive_query(struct listener *listen, time_t now)
857 {
858 struct dns_header *header = (struct dns_header *)daemon->packet;
859 union mysockaddr source_addr;
860 unsigned short type;
861 struct all_addr dst_addr;
862 struct in_addr netmask, dst_addr_4;
863 size_t m;
864 ssize_t n;
865 int if_index = 0, auth_dns = 0;
866 #ifdef HAVE_AUTH
867 int local_auth = 0;
868 #endif
869 struct iovec iov[1];
870 struct msghdr msg;
871 struct cmsghdr *cmptr;
872 union {
873 struct cmsghdr align; /* this ensures alignment */
874 #ifdef HAVE_IPV6
875 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
876 #endif
877 #if defined(HAVE_LINUX_NETWORK)
878 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
879 #elif defined(IP_RECVDSTADDR) && defined(HAVE_SOLARIS_NETWORK)
880 char control[CMSG_SPACE(sizeof(struct in_addr)) +
881 CMSG_SPACE(sizeof(unsigned int))];
882 #elif defined(IP_RECVDSTADDR)
883 char control[CMSG_SPACE(sizeof(struct in_addr)) +
884 CMSG_SPACE(sizeof(struct sockaddr_dl))];
885 #endif
886 } control_u;
887 #ifdef HAVE_IPV6
888 /* Can always get recvd interface for IPv6 */
889 int check_dst = !option_bool(OPT_NOWILD) || listen->family == AF_INET6;
890 #else
891 int check_dst = !option_bool(OPT_NOWILD);
892 #endif
893
894 /* packet buffer overwritten */
895 daemon->srv_save = NULL;
896
897 dst_addr_4.s_addr = 0;
898 netmask.s_addr = 0;
899
900 if (option_bool(OPT_NOWILD) && listen->iface)
901 {
902 auth_dns = listen->iface->dns_auth;
903
904 if (listen->family == AF_INET)
905 {
906 dst_addr_4 = listen->iface->addr.in.sin_addr;
907 netmask = listen->iface->netmask;
908 }
909 }
910
911 iov[0].iov_base = daemon->packet;
912 iov[0].iov_len = daemon->edns_pktsz;
913
914 msg.msg_control = control_u.control;
915 msg.msg_controllen = sizeof(control_u);
916 msg.msg_flags = 0;
917 msg.msg_name = &source_addr;
918 msg.msg_namelen = sizeof(source_addr);
919 msg.msg_iov = iov;
920 msg.msg_iovlen = 1;
921
922 if ((n = recvmsg(listen->fd, &msg, 0)) == -1)
923 return;
924
925 if (n < (int)sizeof(struct dns_header) ||
926 (msg.msg_flags & MSG_TRUNC) ||
927 (header->hb3 & HB3_QR))
928 return;
929
930 source_addr.sa.sa_family = listen->family;
931 #ifdef HAVE_IPV6
932 if (listen->family == AF_INET6)
933 source_addr.in6.sin6_flowinfo = 0;
934 #endif
935
936 if (check_dst)
937 {
938 struct ifreq ifr;
939
940 if (msg.msg_controllen < sizeof(struct cmsghdr))
941 return;
942
943 #if defined(HAVE_LINUX_NETWORK)
944 if (listen->family == AF_INET)
945 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
946 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_PKTINFO)
947 {
948 union {
949 unsigned char *c;
950 struct in_pktinfo *p;
951 } p;
952 p.c = CMSG_DATA(cmptr);
953 dst_addr_4 = dst_addr.addr.addr4 = p.p->ipi_spec_dst;
954 if_index = p.p->ipi_ifindex;
955 }
956 #elif defined(IP_RECVDSTADDR) && defined(IP_RECVIF)
957 if (listen->family == AF_INET)
958 {
959 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
960 {
961 union {
962 unsigned char *c;
963 unsigned int *i;
964 struct in_addr *a;
965 #ifndef HAVE_SOLARIS_NETWORK
966 struct sockaddr_dl *s;
967 #endif
968 } p;
969 p.c = CMSG_DATA(cmptr);
970 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVDSTADDR)
971 dst_addr_4 = dst_addr.addr.addr4 = *(p.a);
972 else if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVIF)
973 #ifdef HAVE_SOLARIS_NETWORK
974 if_index = *(p.i);
975 #else
976 if_index = p.s->sdl_index;
977 #endif
978 }
979 }
980 #endif
981
982 #ifdef HAVE_IPV6
983 if (listen->family == AF_INET6)
984 {
985 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
986 if (cmptr->cmsg_level == IPPROTO_IPV6 && cmptr->cmsg_type == daemon->v6pktinfo)
987 {
988 union {
989 unsigned char *c;
990 struct in6_pktinfo *p;
991 } p;
992 p.c = CMSG_DATA(cmptr);
993
994 dst_addr.addr.addr6 = p.p->ipi6_addr;
995 if_index = p.p->ipi6_ifindex;
996 }
997 }
998 #endif
999
1000 /* enforce available interface configuration */
1001
1002 if (!indextoname(listen->fd, if_index, ifr.ifr_name))
1003 return;
1004
1005 if (!iface_check(listen->family, &dst_addr, ifr.ifr_name, &auth_dns))
1006 {
1007 if (!option_bool(OPT_CLEVERBIND))
1008 enumerate_interfaces(0);
1009 if (!loopback_exception(listen->fd, listen->family, &dst_addr, ifr.ifr_name) &&
1010 !label_exception(if_index, listen->family, &dst_addr))
1011 return;
1012 }
1013
1014 if (listen->family == AF_INET && option_bool(OPT_LOCALISE))
1015 {
1016 struct irec *iface;
1017
1018 /* get the netmask of the interface whch has the address we were sent to.
1019 This is no neccessarily the interface we arrived on. */
1020
1021 for (iface = daemon->interfaces; iface; iface = iface->next)
1022 if (iface->addr.sa.sa_family == AF_INET &&
1023 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
1024 break;
1025
1026 /* interface may be new */
1027 if (!iface && !option_bool(OPT_CLEVERBIND))
1028 enumerate_interfaces(0);
1029
1030 for (iface = daemon->interfaces; iface; iface = iface->next)
1031 if (iface->addr.sa.sa_family == AF_INET &&
1032 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
1033 break;
1034
1035 /* If we failed, abandon localisation */
1036 if (iface)
1037 netmask = iface->netmask;
1038 else
1039 dst_addr_4.s_addr = 0;
1040 }
1041 }
1042
1043 if (extract_request(header, (size_t)n, daemon->namebuff, &type))
1044 {
1045 char types[20];
1046 #ifdef HAVE_AUTH
1047 struct auth_zone *zone;
1048 #endif
1049
1050 querystr(auth_dns ? "auth" : "query", types, type);
1051
1052 if (listen->family == AF_INET)
1053 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1054 (struct all_addr *)&source_addr.in.sin_addr, types);
1055 #ifdef HAVE_IPV6
1056 else
1057 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1058 (struct all_addr *)&source_addr.in6.sin6_addr, types);
1059 #endif
1060
1061 #ifdef HAVE_AUTH
1062 /* find queries for zones we're authoritative for, and answer them directly */
1063 if (!auth_dns)
1064 for (zone = daemon->auth_zones; zone; zone = zone->next)
1065 if (in_zone(zone, daemon->namebuff, NULL))
1066 {
1067 auth_dns = 1;
1068 local_auth = 1;
1069 break;
1070 }
1071 #endif
1072 }
1073
1074 #ifdef HAVE_AUTH
1075 if (auth_dns)
1076 {
1077 m = answer_auth(header, ((char *) header) + daemon->packet_buff_sz, (size_t)n, now, &source_addr, local_auth);
1078 if (m >= 1)
1079 {
1080 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
1081 (char *)header, m, &source_addr, &dst_addr, if_index);
1082 daemon->auth_answer++;
1083 }
1084 }
1085 else
1086 #endif
1087 {
1088 m = answer_request(header, ((char *) header) + daemon->packet_buff_sz, (size_t)n,
1089 dst_addr_4, netmask, now);
1090
1091 if (m >= 1)
1092 {
1093 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
1094 (char *)header, m, &source_addr, &dst_addr, if_index);
1095 daemon->local_answer++;
1096 }
1097 else if (forward_query(listen->fd, &source_addr, &dst_addr, if_index,
1098 header, (size_t)n, now, NULL))
1099 daemon->queries_forwarded++;
1100 else
1101 daemon->local_answer++;
1102 }
1103 }
1104
#ifdef HAVE_DNSSEC
/* Fetch and validate, over the already-connected TCP socket server->tcpfd,
   the DNSKEY or DS RRset that an earlier validation step reported missing,
   recursing up the key hierarchy as needed.

   now     - current time, handed on to the validation routines.
   status  - STAT_NEED_KEY to query for a DNSKEY; any other value (callers
             in this file pass STAT_NEED_DS) queries for a DS record.
   class   - DNS class used for the generated query.
   keyname - owner name to query for.
   server  - upstream server. On a failed exchange its tcpfd is closed
             and set to -1.

   Returns the status of the last validation done at this level, the
   non-secure status of a failed recursive fetch, or STAT_INSECURE when the
   packet buffer cannot be allocated, the TCP exchange fails, or data is
   still missing after a successful recursive fetch. */
static int tcp_key_recurse(time_t now, int status, int class, char *keyname, struct server *server)
{
  size_t n;
  /* Max TCP packet + slop + size */
  unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
  unsigned char *payload;
  struct dns_header *header;
  u16 *length;
  int new_status;
  unsigned char c1, c2;

  /* Without a buffer nothing can be validated. */
  if (!packet)
    return STAT_INSECURE;

  payload = &packet[2];
  header = (struct dns_header *)payload;
  length = (u16 *)packet;

  n = dnssec_generate_query(header, ((char *) header) + 65536, keyname, class,
                            status == STAT_NEED_KEY ? T_DNSKEY : T_DS, &server->addr);

  /* DNS over TCP: two byte length prefix in network order, then the message. */
  *length = htons(n);

  if (!read_write(server->tcpfd, packet, n + sizeof(u16), 0) ||
      !read_write(server->tcpfd, &c1, 1, 1) ||
      !read_write(server->tcpfd, &c2, 1, 1) ||
      !read_write(server->tcpfd, payload, (c1 << 8) | c2, 1))
    {
      close(server->tcpfd);
      server->tcpfd = -1;
      new_status = STAT_INSECURE;
    }
  else
    {
      n = (c1 << 8) | c2;

      if (status == STAT_NEED_KEY)
        new_status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, class);
      else
        new_status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, class);

      if (new_status == STAT_NEED_DS || new_status == STAT_NEED_KEY)
        {
          /* Go one level up for the missing record. The assignment must be
             parenthesised on its own so that new_status holds the recursive
             result and not the outcome of the comparison. */
          if ((new_status = tcp_key_recurse(now, new_status, class, daemon->keyname, server)) == STAT_SECURE)
            {
              /* The missing data has been fetched: validate our own reply again. */
              if (status == STAT_NEED_KEY)
                new_status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, class);
              else
                new_status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, class);

              if (new_status == STAT_NEED_DS || new_status == STAT_NEED_KEY)
                {
                  my_syslog(LOG_ERR, _("Unexpected missing data for DNSSEC validation"));
                  /* Report the failure through the value we actually return. */
                  new_status = STAT_INSECURE;
                }
            }
        }
    }

  free(packet);

  return new_status;
}
#endif
1163
1164
1165 /* The daemon forks before calling this: it should deal with one connection,
1166 blocking as neccessary, and then return. Note, need to be a bit careful
1167 about resources for debug mode, when the fork is suppressed: that's
1168 done by the caller. */
1169 unsigned char *tcp_request(int confd, time_t now,
1170 union mysockaddr *local_addr, struct in_addr netmask, int auth_dns)
1171 {
1172 size_t size = 0;
1173 int norebind = 0;
1174 #ifdef HAVE_AUTH
1175 int local_auth = 0;
1176 #endif
1177 int checking_disabled, check_subnet, no_cache_dnssec = 0, cache_secure = 0;
1178 size_t m;
1179 unsigned short qtype;
1180 unsigned int gotname;
1181 unsigned char c1, c2;
1182 /* Max TCP packet + slop + size */
1183 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
1184 unsigned char *payload = &packet[2];
1185 /* largest field in header is 16-bits, so this is still sufficiently aligned */
1186 struct dns_header *header = (struct dns_header *)payload;
1187 u16 *length = (u16 *)packet;
1188 struct server *last_server;
1189 struct in_addr dst_addr_4;
1190 union mysockaddr peer_addr;
1191 socklen_t peer_len = sizeof(union mysockaddr);
1192
1193 if (getpeername(confd, (struct sockaddr *)&peer_addr, &peer_len) == -1)
1194 return packet;
1195
1196 while (1)
1197 {
1198 if (!packet ||
1199 !read_write(confd, &c1, 1, 1) || !read_write(confd, &c2, 1, 1) ||
1200 !(size = c1 << 8 | c2) ||
1201 !read_write(confd, payload, size, 1))
1202 return packet;
1203
1204 if (size < (int)sizeof(struct dns_header))
1205 continue;
1206
1207 check_subnet = 0;
1208
1209 /* save state of "cd" flag in query */
1210 if ((checking_disabled = header->hb4 & HB4_CD))
1211 no_cache_dnssec = 1;
1212
1213 /* RFC 4035: sect 4.6 para 2 */
1214 header->hb4 &= ~HB4_AD;
1215
1216 if ((gotname = extract_request(header, (unsigned int)size, daemon->namebuff, &qtype)))
1217 {
1218 char types[20];
1219 #ifdef HAVE_AUTH
1220 struct auth_zone *zone;
1221 #endif
1222 querystr(auth_dns ? "auth" : "query", types, qtype);
1223
1224 if (peer_addr.sa.sa_family == AF_INET)
1225 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1226 (struct all_addr *)&peer_addr.in.sin_addr, types);
1227 #ifdef HAVE_IPV6
1228 else
1229 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1230 (struct all_addr *)&peer_addr.in6.sin6_addr, types);
1231 #endif
1232
1233 #ifdef HAVE_AUTH
1234 /* find queries for zones we're authoritative for, and answer them directly */
1235 if (!auth_dns)
1236 for (zone = daemon->auth_zones; zone; zone = zone->next)
1237 if (in_zone(zone, daemon->namebuff, NULL))
1238 {
1239 auth_dns = 1;
1240 local_auth = 1;
1241 break;
1242 }
1243 #endif
1244 }
1245
1246 if (local_addr->sa.sa_family == AF_INET)
1247 dst_addr_4 = local_addr->in.sin_addr;
1248 else
1249 dst_addr_4.s_addr = 0;
1250
1251 #ifdef HAVE_AUTH
1252 if (auth_dns)
1253 m = answer_auth(header, ((char *) header) + 65536, (size_t)size, now, &peer_addr, local_auth);
1254 else
1255 #endif
1256 {
1257 /* m > 0 if answered from cache */
1258 m = answer_request(header, ((char *) header) + 65536, (size_t)size,
1259 dst_addr_4, netmask, now);
1260
1261 /* Do this by steam now we're not in the select() loop */
1262 check_log_writer(NULL);
1263
1264 if (m == 0)
1265 {
1266 unsigned int flags = 0;
1267 struct all_addr *addrp = NULL;
1268 int type = 0;
1269 char *domain = NULL;
1270
1271 if (option_bool(OPT_ADD_MAC))
1272 size = add_mac(header, size, ((char *) header) + 65536, &peer_addr);
1273
1274 if (option_bool(OPT_CLIENT_SUBNET))
1275 {
1276 size_t new = add_source_addr(header, size, ((char *) header) + 65536, &peer_addr);
1277 if (size != new)
1278 {
1279 size = new;
1280 check_subnet = 1;
1281 }
1282 }
1283
1284 if (gotname)
1285 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
1286
1287 if (type != 0 || option_bool(OPT_ORDER) || !daemon->last_server)
1288 last_server = daemon->servers;
1289 else
1290 last_server = daemon->last_server;
1291
1292 if (!flags && last_server)
1293 {
1294 struct server *firstsendto = NULL;
1295 unsigned int crc = questions_crc(header, (unsigned int)size, daemon->namebuff);
1296
1297 /* Loop round available servers until we succeed in connecting to one.
1298 Note that this code subtley ensures that consecutive queries on this connection
1299 which can go to the same server, do so. */
1300 while (1)
1301 {
1302 if (!firstsendto)
1303 firstsendto = last_server;
1304 else
1305 {
1306 if (!(last_server = last_server->next))
1307 last_server = daemon->servers;
1308
1309 if (last_server == firstsendto)
1310 break;
1311 }
1312
1313 /* server for wrong domain */
1314 if (type != (last_server->flags & SERV_TYPE) ||
1315 (type == SERV_HAS_DOMAIN && !hostname_isequal(domain, last_server->domain)))
1316 continue;
1317
1318 if (last_server->tcpfd == -1)
1319 {
1320 if ((last_server->tcpfd = socket(last_server->addr.sa.sa_family, SOCK_STREAM, 0)) == -1)
1321 continue;
1322
1323 if ((!local_bind(last_server->tcpfd, &last_server->source_addr, last_server->interface, 1) ||
1324 connect(last_server->tcpfd, &last_server->addr.sa, sa_len(&last_server->addr)) == -1))
1325 {
1326 close(last_server->tcpfd);
1327 last_server->tcpfd = -1;
1328 continue;
1329 }
1330
1331 #ifdef HAVE_DNSSEC
1332 if (option_bool(OPT_DNSSEC_VALID))
1333 {
1334 size = add_do_bit(header, size, ((char *) header) + 65536);
1335 header->hb4 |= HB4_CD;
1336 }
1337 #endif
1338
1339 #ifdef HAVE_CONNTRACK
1340 /* Copy connection mark of incoming query to outgoing connection. */
1341 if (option_bool(OPT_CONNTRACK))
1342 {
1343 unsigned int mark;
1344 struct all_addr local;
1345 #ifdef HAVE_IPV6
1346 if (local_addr->sa.sa_family == AF_INET6)
1347 local.addr.addr6 = local_addr->in6.sin6_addr;
1348 else
1349 #endif
1350 local.addr.addr4 = local_addr->in.sin_addr;
1351
1352 if (get_incoming_mark(&peer_addr, &local, 1, &mark))
1353 setsockopt(last_server->tcpfd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
1354 }
1355 #endif
1356 }
1357
1358 *length = htons(size);
1359
1360 if (!read_write(last_server->tcpfd, packet, size + sizeof(u16), 0) ||
1361 !read_write(last_server->tcpfd, &c1, 1, 1) ||
1362 !read_write(last_server->tcpfd, &c2, 1, 1) ||
1363 !read_write(last_server->tcpfd, payload, (c1 << 8) | c2, 1))
1364 {
1365 close(last_server->tcpfd);
1366 last_server->tcpfd = -1;
1367 continue;
1368 }
1369
1370 m = (c1 << 8) | c2;
1371
1372 if (!gotname)
1373 strcpy(daemon->namebuff, "query");
1374 if (last_server->addr.sa.sa_family == AF_INET)
1375 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1376 (struct all_addr *)&last_server->addr.in.sin_addr, NULL);
1377 #ifdef HAVE_IPV6
1378 else
1379 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1380 (struct all_addr *)&last_server->addr.in6.sin6_addr, NULL);
1381 #endif
1382
1383 #ifdef HAVE_DNSSEC
1384 if (option_bool(OPT_DNSSEC_VALID) && !checking_disabled)
1385 {
1386 int class, status;
1387
1388 status = dnssec_validate_reply(now, header, m, daemon->namebuff, daemon->keyname, &class);
1389
1390 if (status == STAT_NEED_DS || status == STAT_NEED_KEY)
1391 {
1392 if ((status = tcp_key_recurse(now, status, class, daemon->keyname, last_server)) == STAT_SECURE)
1393 status = dnssec_validate_reply(now, header, m, daemon->namebuff, daemon->keyname, &class);
1394 }
1395
1396 log_query(F_KEYTAG | F_SECSTAT, "result", NULL,
1397 status == STAT_SECURE ? "SECURE" : (status == STAT_INSECURE ? "INSECURE" : "BOGUS"));
1398
1399 if (status == STAT_BOGUS)
1400 no_cache_dnssec = 1;
1401
1402 if (status == STAT_SECURE)
1403 cache_secure = 1;
1404 }
1405 #endif
1406
1407 /* restore CD bit to the value in the query */
1408 if (checking_disabled)
1409 header->hb4 |= HB4_CD;
1410 else
1411 header->hb4 &= ~HB4_CD;
1412
1413 /* There's no point in updating the cache, since this process will exit and
1414 lose the information after a few queries. We make this call for the alias and
1415 bogus-nxdomain side-effects. */
1416 /* If the crc of the question section doesn't match the crc we sent, then
1417 someone might be attempting to insert bogus values into the cache by
1418 sending replies containing questions and bogus answers. */
1419 if (crc == questions_crc(header, (unsigned int)m, daemon->namebuff))
1420 m = process_reply(header, now, last_server, (unsigned int)m,
1421 option_bool(OPT_NO_REBIND) && !norebind, no_cache_dnssec,
1422 cache_secure, check_subnet, &peer_addr);
1423
1424 break;
1425 }
1426 }
1427
1428 /* In case of local answer or no connections made. */
1429 if (m == 0)
1430 m = setup_reply(header, (unsigned int)size, addrp, flags, daemon->local_ttl);
1431 }
1432 }
1433
1434 check_log_writer(NULL);
1435
1436 *length = htons(m);
1437
1438 if (m == 0 || !read_write(confd, packet, m + sizeof(u16), 0))
1439 return packet;
1440 }
1441 }
1442
1443 static struct frec *allocate_frec(time_t now)
1444 {
1445 struct frec *f;
1446
1447 if ((f = (struct frec *)whine_malloc(sizeof(struct frec))))
1448 {
1449 f->next = daemon->frec_list;
1450 f->time = now;
1451 f->sentto = NULL;
1452 f->rfd4 = NULL;
1453 f->flags = 0;
1454 #ifdef HAVE_IPV6
1455 f->rfd6 = NULL;
1456 #endif
1457 #ifdef HAVE_DNSSEC
1458 f->blocking_query = NULL;
1459 #endif
1460 daemon->frec_list = f;
1461 }
1462
1463 return f;
1464 }
1465
1466 static struct randfd *allocate_rfd(int family)
1467 {
1468 static int finger = 0;
1469 int i;
1470
1471 /* limit the number of sockets we have open to avoid starvation of
1472 (eg) TFTP. Once we have a reasonable number, randomness should be OK */
1473
1474 for (i = 0; i < RANDOM_SOCKS; i++)
1475 if (daemon->randomsocks[i].refcount == 0)
1476 {
1477 if ((daemon->randomsocks[i].fd = random_sock(family)) == -1)
1478 break;
1479
1480 daemon->randomsocks[i].refcount = 1;
1481 daemon->randomsocks[i].family = family;
1482 return &daemon->randomsocks[i];
1483 }
1484
1485 /* No free ones or cannot get new socket, grab an existing one */
1486 for (i = 0; i < RANDOM_SOCKS; i++)
1487 {
1488 int j = (i+finger) % RANDOM_SOCKS;
1489 if (daemon->randomsocks[j].refcount != 0 &&
1490 daemon->randomsocks[j].family == family &&
1491 daemon->randomsocks[j].refcount != 0xffff)
1492 {
1493 finger = j;
1494 daemon->randomsocks[j].refcount++;
1495 return &daemon->randomsocks[j];
1496 }
1497 }
1498
1499 return NULL; /* doom */
1500 }
1501 static void free_frec(struct frec *f)
1502 {
1503 if (f->rfd4 && --(f->rfd4->refcount) == 0)
1504 close(f->rfd4->fd);
1505
1506 f->rfd4 = NULL;
1507 f->sentto = NULL;
1508 f->flags = 0;
1509
1510 #ifdef HAVE_IPV6
1511 if (f->rfd6 && --(f->rfd6->refcount) == 0)
1512 close(f->rfd6->fd);
1513
1514 f->rfd6 = NULL;
1515 #endif
1516
1517 #ifdef HAVE_DNSSEC
1518 if (f->stash)
1519 {
1520 blockdata_free(f->stash);
1521 f->stash = NULL;
1522 }
1523
1524 /* Anything we're waiting on is pointless now, too */
1525 if (f->blocking_query)
1526 free_frec(f->blocking_query);
1527 f->blocking_query = NULL;
1528
1529 #endif
1530 }
1531
1532 /* if wait==NULL return a free or older than TIMEOUT record.
1533 else return *wait zero if one available, or *wait is delay to
1534 when the oldest in-use record will expire. Impose an absolute
1535 limit of 4*TIMEOUT before we wipe things (for random sockets).
1536 If force is set, always return a result, even if we have
1537 to allocate above the limit. */
1538 struct frec *get_new_frec(time_t now, int *wait, int force)
1539 {
1540 struct frec *f, *oldest, *target;
1541 int count;
1542
1543 if (wait)
1544 *wait = 0;
1545
1546 for (f = daemon->frec_list, oldest = NULL, target = NULL, count = 0; f; f = f->next, count++)
1547 if (!f->sentto)
1548 target = f;
1549 else
1550 {
1551 if (difftime(now, f->time) >= 4*TIMEOUT)
1552 {
1553 free_frec(f);
1554 target = f;
1555 }
1556
1557 if (!oldest || difftime(f->time, oldest->time) <= 0)
1558 oldest = f;
1559 }
1560
1561 if (target)
1562 {
1563 target->time = now;
1564 return target;
1565 }
1566
1567 /* can't find empty one, use oldest if there is one
1568 and it's older than timeout */
1569 if (oldest && ((int)difftime(now, oldest->time)) >= TIMEOUT)
1570 {
1571 /* keep stuff for twice timeout if we can by allocating a new
1572 record instead */
1573 if (difftime(now, oldest->time) < 2*TIMEOUT &&
1574 count <= daemon->ftabsize &&
1575 (f = allocate_frec(now)))
1576 return f;
1577
1578 if (!wait)
1579 {
1580 free_frec(oldest);
1581 oldest->time = now;
1582 }
1583 return oldest;
1584 }
1585
1586 /* none available, calculate time 'till oldest record expires */
1587 if (!force && count > daemon->ftabsize)
1588 {
1589 static time_t last_log = 0;
1590
1591 if (oldest && wait)
1592 *wait = oldest->time + (time_t)TIMEOUT - now;
1593
1594 if ((int)difftime(now, last_log) > 5)
1595 {
1596 last_log = now;
1597 my_syslog(LOG_WARNING, _("Maximum number of concurrent DNS queries reached (max: %d)"), daemon->ftabsize);
1598 }
1599
1600 return NULL;
1601 }
1602
1603 if (!(f = allocate_frec(now)) && wait)
1604 /* wait one second on malloc failure */
1605 *wait = 1;
1606
1607 return f; /* OK if malloc fails and this is NULL */
1608 }
1609
1610 /* crc is all-ones if not known. */
1611 static struct frec *lookup_frec(unsigned short id, unsigned int crc)
1612 {
1613 struct frec *f;
1614
1615 for(f = daemon->frec_list; f; f = f->next)
1616 if (f->sentto && f->new_id == id &&
1617 (f->crc == crc || crc == 0xffffffff))
1618 return f;
1619
1620 return NULL;
1621 }
1622
1623 static struct frec *lookup_frec_by_sender(unsigned short id,
1624 union mysockaddr *addr,
1625 unsigned int crc)
1626 {
1627 struct frec *f;
1628
1629 for(f = daemon->frec_list; f; f = f->next)
1630 if (f->sentto &&
1631 f->orig_id == id &&
1632 f->crc == crc &&
1633 sockaddr_isequal(&f->source, addr))
1634 return f;
1635
1636 return NULL;
1637 }
1638
1639 /* A server record is going away, remove references to it */
1640 void server_gone(struct server *server)
1641 {
1642 struct frec *f;
1643
1644 for (f = daemon->frec_list; f; f = f->next)
1645 if (f->sentto && f->sentto == server)
1646 free_frec(f);
1647
1648 if (daemon->last_server == server)
1649 daemon->last_server = NULL;
1650
1651 if (daemon->srv_save == server)
1652 daemon->srv_save = NULL;
1653 }
1654
/* Return a random 16-bit id that lookup_frec() does not find among the
   records in use for this question crc. Ids are drawn from rand16() until
   one is free. */
static unsigned short get_id(unsigned int crc)
{
  unsigned short candidate;

  for (;;)
    {
      candidate = rand16();

      if (!lookup_frec(candidate, crc))
        return candidate;
    }
}
1666
1667
1668
1669
1670