]> git.ipfire.org Git - people/ms/dnsmasq.git/blob - src/forward.c
DNSSEC for TCP queries.
[people/ms/dnsmasq.git] / src / forward.c
1 /* dnsmasq is Copyright (c) 2000-2013 Simon Kelley
2
3 This program is free software; you can redistribute it and/or modify
4 it under the terms of the GNU General Public License as published by
5 the Free Software Foundation; version 2 dated June, 1991, or
6 (at your option) version 3 dated 29 June, 2007.
7
8 This program is distributed in the hope that it will be useful,
9 but WITHOUT ANY WARRANTY; without even the implied warranty of
10 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 GNU General Public License for more details.
12
13 You should have received a copy of the GNU General Public License
14 along with this program. If not, see <http://www.gnu.org/licenses/>.
15 */
16
17 #include "dnsmasq.h"
18
/* Forward declarations of the file-local (static) helpers that the
   functions below call before their definitions appear. */
19 static struct frec *lookup_frec(unsigned short id, unsigned int crc);
20 static struct frec *lookup_frec_by_sender(unsigned short id,
21 union mysockaddr *addr,
22 unsigned int crc);
23 static unsigned short get_id(unsigned int crc);
24 static void free_frec(struct frec *f);
25 static struct randfd *allocate_rfd(int family);
26
27 /* Send a UDP packet with its source address set as "source"
28 unless nowild is true, when we just send it with the kernel default */
29 int send_from(int fd, int nowild, char *packet, size_t len,
30 union mysockaddr *to, struct all_addr *source,
31 unsigned int iface)
32 {
33 struct msghdr msg;
34 struct iovec iov[1];
35 union {
36 struct cmsghdr align; /* this ensures alignment */
37 #if defined(HAVE_LINUX_NETWORK)
38 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
39 #elif defined(IP_SENDSRCADDR)
40 char control[CMSG_SPACE(sizeof(struct in_addr))];
41 #endif
42 #ifdef HAVE_IPV6
43 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
44 #endif
45 } control_u;
46
47 iov[0].iov_base = packet;
48 iov[0].iov_len = len;
49
50 msg.msg_control = NULL;
51 msg.msg_controllen = 0;
52 msg.msg_flags = 0;
53 msg.msg_name = to;
54 msg.msg_namelen = sa_len(to);
55 msg.msg_iov = iov;
56 msg.msg_iovlen = 1;
57
58 if (!nowild)
59 {
60 struct cmsghdr *cmptr;
61 msg.msg_control = &control_u;
62 msg.msg_controllen = sizeof(control_u);
63 cmptr = CMSG_FIRSTHDR(&msg);
64
65 if (to->sa.sa_family == AF_INET)
66 {
67 #if defined(HAVE_LINUX_NETWORK)
68 struct in_pktinfo p;
69 p.ipi_ifindex = 0;
70 p.ipi_spec_dst = source->addr.addr4;
71 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
72 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_pktinfo));
73 cmptr->cmsg_level = IPPROTO_IP;
74 cmptr->cmsg_type = IP_PKTINFO;
75 #elif defined(IP_SENDSRCADDR)
76 memcpy(CMSG_DATA(cmptr), &(source->addr.addr4), sizeof(source->addr.addr4));
77 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_addr));
78 cmptr->cmsg_level = IPPROTO_IP;
79 cmptr->cmsg_type = IP_SENDSRCADDR;
80 #endif
81 }
82 else
83 #ifdef HAVE_IPV6
84 {
85 struct in6_pktinfo p;
86 p.ipi6_ifindex = iface; /* Need iface for IPv6 to handle link-local addrs */
87 p.ipi6_addr = source->addr.addr6;
88 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
89 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
90 cmptr->cmsg_type = daemon->v6pktinfo;
91 cmptr->cmsg_level = IPPROTO_IPV6;
92 }
93 #else
94 (void)iface; /* eliminate warning */
95 #endif
96 }
97
98 while (sendmsg(fd, &msg, 0) == -1)
99 {
100 if (retry_send())
101 continue;
102
103 /* If interface is still in DAD, EINVAL results - ignore that. */
104 if (errno == EINVAL)
105 break;
106
107 my_syslog(LOG_ERR, _("failed to send packet: %s"), strerror(errno));
108 return 0;
109 }
110
111 return 1;
112 }
113
114 static unsigned int search_servers(time_t now, struct all_addr **addrpp,
115 unsigned int qtype, char *qdomain, int *type, char **domain, int *norebind)
116
117 {
118 /* If the query ends in the domain in one of our servers, set
119 domain to point to that name. We find the largest match to allow both
120 domain.org and sub.domain.org to exist. */
121
122 unsigned int namelen = strlen(qdomain);
123 unsigned int matchlen = 0;
124 struct server *serv;
125 unsigned int flags = 0;
126
127 for (serv = daemon->servers; serv; serv=serv->next)
128 /* domain matches take priority over NODOTS matches */
129 if ((serv->flags & SERV_FOR_NODOTS) && *type != SERV_HAS_DOMAIN && !strchr(qdomain, '.') && namelen != 0)
130 {
131 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
132 *type = SERV_FOR_NODOTS;
133 if (serv->flags & SERV_NO_ADDR)
134 flags = F_NXDOMAIN;
135 else if (serv->flags & SERV_LITERAL_ADDRESS)
136 {
137 if (sflag & qtype)
138 {
139 flags = sflag;
140 if (serv->addr.sa.sa_family == AF_INET)
141 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
142 #ifdef HAVE_IPV6
143 else
144 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
145 #endif
146 }
147 else if (!flags || (flags & F_NXDOMAIN))
148 flags = F_NOERR;
149 }
150 }
151 else if (serv->flags & SERV_HAS_DOMAIN)
152 {
153 unsigned int domainlen = strlen(serv->domain);
154 char *matchstart = qdomain + namelen - domainlen;
155 if (namelen >= domainlen &&
156 hostname_isequal(matchstart, serv->domain) &&
157 (domainlen == 0 || namelen == domainlen || *(matchstart-1) == '.' ))
158 {
159 if (serv->flags & SERV_NO_REBIND)
160 *norebind = 1;
161 else
162 {
163 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
164 /* implement priority rules for --address and --server for same domain.
165 --address wins if the address is for the correct AF
166 --server wins otherwise. */
167 if (domainlen != 0 && domainlen == matchlen)
168 {
169 if ((serv->flags & SERV_LITERAL_ADDRESS))
170 {
171 if (!(sflag & qtype) && flags == 0)
172 continue;
173 }
174 else
175 {
176 if (flags & (F_IPV4 | F_IPV6))
177 continue;
178 }
179 }
180
181 if (domainlen >= matchlen)
182 {
183 *type = serv->flags & (SERV_HAS_DOMAIN | SERV_USE_RESOLV | SERV_NO_REBIND);
184 *domain = serv->domain;
185 matchlen = domainlen;
186 if (serv->flags & SERV_NO_ADDR)
187 flags = F_NXDOMAIN;
188 else if (serv->flags & SERV_LITERAL_ADDRESS)
189 {
190 if (sflag & qtype)
191 {
192 flags = sflag;
193 if (serv->addr.sa.sa_family == AF_INET)
194 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
195 #ifdef HAVE_IPV6
196 else
197 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
198 #endif
199 }
200 else if (!flags || (flags & F_NXDOMAIN))
201 flags = F_NOERR;
202 }
203 else
204 flags = 0;
205 }
206 }
207 }
208 }
209
210 if (flags == 0 && !(qtype & F_QUERY) &&
211 option_bool(OPT_NODOTS_LOCAL) && !strchr(qdomain, '.') && namelen != 0)
212 /* don't forward A or AAAA queries for simple names, except the empty name */
213 flags = F_NOERR;
214
215 if (flags == F_NXDOMAIN && check_for_local_domain(qdomain, now))
216 flags = F_NOERR;
217
218 if (flags)
219 {
220 int logflags = 0;
221
222 if (flags == F_NXDOMAIN || flags == F_NOERR)
223 logflags = F_NEG | qtype;
224
225 log_query(logflags | flags | F_CONFIG | F_FORWARD, qdomain, *addrpp, NULL);
226 }
227 else if ((*type) & SERV_USE_RESOLV)
228 {
229 *type = 0; /* use normal servers for this domain */
230 *domain = NULL;
231 }
232 return flags;
233 }
234
235 static int forward_query(int udpfd, union mysockaddr *udpaddr,
236 struct all_addr *dst_addr, unsigned int dst_iface,
237 struct dns_header *header, size_t plen, time_t now, struct frec *forward)
238 {
239 char *domain = NULL;
240 int type = 0, norebind = 0;
241 struct all_addr *addrp = NULL;
242 unsigned int crc = questions_crc(header, plen, daemon->namebuff);
243 unsigned int flags = 0;
244 unsigned int gotname = extract_request(header, plen, daemon->namebuff, NULL);
245 struct server *start = NULL;
246
247 /* RFC 4035: sect 4.6 para 2 */
248 header->hb4 &= ~HB4_AD;
249
250 /* may be no servers available. */
251 if (!daemon->servers)
252 forward = NULL;
253 else if (forward || (forward = lookup_frec_by_sender(ntohs(header->id), udpaddr, crc)))
254 {
255 /* retry on existing query, send to all available servers */
256 domain = forward->sentto->domain;
257 forward->sentto->failed_queries++;
258 if (!option_bool(OPT_ORDER))
259 {
260 forward->forwardall = 1;
261 daemon->last_server = NULL;
262 }
263 type = forward->sentto->flags & SERV_TYPE;
264 if (!(start = forward->sentto->next))
265 start = daemon->servers; /* at end of list, recycle */
266 header->id = htons(forward->new_id);
267 }
268 else
269 {
270 if (gotname)
271 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
272
273 if (!flags && !(forward = get_new_frec(now, NULL, 0)))
274 /* table full - server failure. */
275 flags = F_NEG;
276
277 if (forward)
278 {
279 forward->source = *udpaddr;
280 forward->dest = *dst_addr;
281 forward->iface = dst_iface;
282 forward->orig_id = ntohs(header->id);
283 forward->new_id = get_id(crc);
284 forward->fd = udpfd;
285 forward->crc = crc;
286 forward->forwardall = 0;
287 forward->flags = 0;
288 if (norebind)
289 forward->flags |= FREC_NOREBIND;
290 if (header->hb4 & HB4_CD)
291 forward->flags |= FREC_CHECKING_DISABLED;
292
293 header->id = htons(forward->new_id);
294
295 /* In strict_order mode, always try servers in the order
296 specified in resolv.conf, if a domain is given
297 always try all the available servers,
298 otherwise, use the one last known to work. */
299
300 if (type == 0)
301 {
302 if (option_bool(OPT_ORDER))
303 start = daemon->servers;
304 else if (!(start = daemon->last_server) ||
305 daemon->forwardcount++ > FORWARD_TEST ||
306 difftime(now, daemon->forwardtime) > FORWARD_TIME)
307 {
308 start = daemon->servers;
309 forward->forwardall = 1;
310 daemon->forwardcount = 0;
311 daemon->forwardtime = now;
312 }
313 }
314 else
315 {
316 start = daemon->servers;
317 if (!option_bool(OPT_ORDER))
318 forward->forwardall = 1;
319 }
320 }
321 }
322
323 /* check for send errors here (no route to host)
324 if we fail to send to all nameservers, send back an error
325 packet straight away (helps modem users when offline) */
326
327 if (!flags && forward)
328 {
329 struct server *firstsentto = start;
330 int forwarded = 0;
331
332 if (option_bool(OPT_ADD_MAC))
333 plen = add_mac(header, plen, ((char *) header) + daemon->packet_buff_sz, &forward->source);
334
335 if (option_bool(OPT_CLIENT_SUBNET))
336 {
337 size_t new = add_source_addr(header, plen, ((char *) header) + daemon->packet_buff_sz, &forward->source);
338 if (new != plen)
339 {
340 plen = new;
341 forward->flags |= FREC_HAS_SUBNET;
342 }
343 }
344
345 #ifdef HAVE_DNSSEC
346 if (option_bool(OPT_DNSSEC_VALID))
347 {
348 plen = add_do_bit(header, plen, ((char *) header) + daemon->packet_buff_sz);
349 header->hb4 |= HB4_CD;
350 }
351 #endif
352
353 while (1)
354 {
355 /* only send to servers dealing with our domain.
356 domain may be NULL, in which case server->domain
357 must be NULL also. */
358
359 if (type == (start->flags & SERV_TYPE) &&
360 (type != SERV_HAS_DOMAIN || hostname_isequal(domain, start->domain)) &&
361 !(start->flags & SERV_LITERAL_ADDRESS))
362 {
363 int fd;
364
365 /* find server socket to use, may need to get random one. */
366 if (start->sfd)
367 fd = start->sfd->fd;
368 else
369 {
370 #ifdef HAVE_IPV6
371 if (start->addr.sa.sa_family == AF_INET6)
372 {
373 if (!forward->rfd6 &&
374 !(forward->rfd6 = allocate_rfd(AF_INET6)))
375 break;
376 daemon->rfd_save = forward->rfd6;
377 fd = forward->rfd6->fd;
378 }
379 else
380 #endif
381 {
382 if (!forward->rfd4 &&
383 !(forward->rfd4 = allocate_rfd(AF_INET)))
384 break;
385 daemon->rfd_save = forward->rfd4;
386 fd = forward->rfd4->fd;
387 }
388
389 #ifdef HAVE_CONNTRACK
390 /* Copy connection mark of incoming query to outgoing connection. */
391 if (option_bool(OPT_CONNTRACK))
392 {
393 unsigned int mark;
394 if (get_incoming_mark(&forward->source, &forward->dest, 0, &mark))
395 setsockopt(fd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
396 }
397 #endif
398 }
399
400 if (sendto(fd, (char *)header, plen, 0,
401 &start->addr.sa,
402 sa_len(&start->addr)) == -1)
403 {
404 if (retry_send())
405 continue;
406 }
407 else
408 {
409 /* Keep info in case we want to re-send this packet */
410 daemon->srv_save = start;
411 daemon->packet_len = plen;
412
413 if (!gotname)
414 strcpy(daemon->namebuff, "query");
415 if (start->addr.sa.sa_family == AF_INET)
416 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
417 (struct all_addr *)&start->addr.in.sin_addr, NULL);
418 #ifdef HAVE_IPV6
419 else
420 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
421 (struct all_addr *)&start->addr.in6.sin6_addr, NULL);
422 #endif
423 start->queries++;
424 forwarded = 1;
425 forward->sentto = start;
426 if (!forward->forwardall)
427 break;
428 forward->forwardall++;
429 }
430 }
431
432 if (!(start = start->next))
433 start = daemon->servers;
434
435 if (start == firstsentto)
436 break;
437 }
438
439 if (forwarded)
440 return 1;
441
442 /* could not send on, prepare to return */
443 header->id = htons(forward->orig_id);
444 free_frec(forward); /* cancel */
445 }
446
447 /* could not send on, return empty answer or address if known for whole domain */
448 if (udpfd != -1)
449 {
450 plen = setup_reply(header, plen, addrp, flags, daemon->local_ttl);
451 send_from(udpfd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND), (char *)header, plen, udpaddr, dst_addr, dst_iface);
452 }
453
454 return 0;
455 }
456
457 static size_t process_reply(struct dns_header *header, time_t now, struct server *server, size_t n, int check_rebind,
458 int no_cache, int cache_secure, int check_subnet, union mysockaddr *query_source)
459 {
460 unsigned char *pheader, *sizep;
461 char **sets = 0;
462 int munged = 0, is_sign;
463 size_t plen;
464 int squash_ad = 0;
465
466 #ifdef HAVE_IPSET
467 /* Similar algorithm to search_servers. */
468 struct ipsets *ipset_pos;
469 unsigned int namelen = strlen(daemon->namebuff);
470 unsigned int matchlen = 0;
471 for (ipset_pos = daemon->ipsets; ipset_pos; ipset_pos = ipset_pos->next)
472 {
473 unsigned int domainlen = strlen(ipset_pos->domain);
474 char *matchstart = daemon->namebuff + namelen - domainlen;
475 if (namelen >= domainlen && hostname_isequal(matchstart, ipset_pos->domain) &&
476 (domainlen == 0 || namelen == domainlen || *(matchstart - 1) == '.' ) &&
477 domainlen >= matchlen) {
478 matchlen = domainlen;
479 sets = ipset_pos->sets;
480 }
481 }
482 #endif
483
484 /* If upstream is advertising a larger UDP packet size
485 than we allow, trim it so that we don't get overlarge
486 requests for the client. We can't do this for signed packets. */
487
488 if ((pheader = find_pseudoheader(header, n, &plen, &sizep, &is_sign)))
489 {
490 if (!is_sign)
491 {
492 unsigned short udpsz;
493 unsigned char *psave = sizep;
494
495 GETSHORT(udpsz, sizep);
496 if (udpsz > daemon->edns_pktsz)
497 PUTSHORT(daemon->edns_pktsz, psave);
498 }
499
500 if (check_subnet && !check_source(header, plen, pheader, query_source))
501 {
502 my_syslog(LOG_WARNING, _("discarding DNS reply: subnet option mismatch"));
503 return 0;
504 }
505 }
506
507 /* RFC 4035 sect 4.6 para 3 */
508 if (!is_sign && !option_bool(OPT_DNSSEC_PROXY))
509 squash_ad = 1;
510
511 #ifdef HAVE_DNSSEC
512 if (option_bool(OPT_DNSSEC_VALID))
513 squash_ad = no_cache;
514
515 if (cache_secure)
516 header->hb4 |= HB4_AD;
517 #endif
518
519 if (squash_ad)
520 header->hb4 &= ~HB4_AD;
521
522 if (OPCODE(header) != QUERY || (RCODE(header) != NOERROR && RCODE(header) != NXDOMAIN))
523 return n;
524
525 /* Complain loudly if the upstream server is non-recursive. */
526 if (!(header->hb4 & HB4_RA) && RCODE(header) == NOERROR && ntohs(header->ancount) == 0 &&
527 server && !(server->flags & SERV_WARNED_RECURSIVE))
528 {
529 prettyprint_addr(&server->addr, daemon->namebuff);
530 my_syslog(LOG_WARNING, _("nameserver %s refused to do a recursive query"), daemon->namebuff);
531 if (!option_bool(OPT_LOG))
532 server->flags |= SERV_WARNED_RECURSIVE;
533 }
534
535 if (daemon->bogus_addr && RCODE(header) != NXDOMAIN &&
536 check_for_bogus_wildcard(header, n, daemon->namebuff, daemon->bogus_addr, now))
537 {
538 munged = 1;
539 SET_RCODE(header, NXDOMAIN);
540 header->hb3 &= ~HB3_AA;
541 }
542 else
543 {
544 if (RCODE(header) == NXDOMAIN &&
545 extract_request(header, n, daemon->namebuff, NULL) &&
546 check_for_local_domain(daemon->namebuff, now))
547 {
548 /* if we forwarded a query for a locally known name (because it was for
549 an unknown type) and the answer is NXDOMAIN, convert that to NODATA,
550 since we know that the domain exists, even if upstream doesn't */
551 munged = 1;
552 header->hb3 |= HB3_AA;
553 SET_RCODE(header, NOERROR);
554 }
555
556 if (extract_addresses(header, n, daemon->namebuff, now, sets, is_sign, check_rebind, no_cache, cache_secure))
557 {
558 my_syslog(LOG_WARNING, _("possible DNS-rebind attack detected: %s"), daemon->namebuff);
559 munged = 1;
560 }
561 }
562
563 /* do this after extract_addresses. Ensure NODATA reply and remove
564 nameserver info. */
565
566 if (munged)
567 {
568 header->ancount = htons(0);
569 header->nscount = htons(0);
570 header->arcount = htons(0);
571 }
572
573 /* the bogus-nxdomain stuff, doctor and NXDOMAIN->NODATA munging can all elide
574 sections of the packet. Find the new length here and put back pseudoheader
575 if it was removed. */
576 return resize_packet(header, n, pheader, plen);
577 }
578
579 /* sets new last_server */
580 void reply_query(int fd, int family, time_t now)
581 {
582 /* packet from peer server, extract data for cache, and send to
583 original requester */
584 struct dns_header *header;
585 union mysockaddr serveraddr;
586 struct frec *forward;
587 socklen_t addrlen = sizeof(serveraddr);
588 ssize_t n = recvfrom(fd, daemon->packet, daemon->packet_buff_sz, 0, &serveraddr.sa, &addrlen);
589 size_t nn;
590 struct server *server;
591
592 /* packet buffer overwritten */
593 daemon->srv_save = NULL;
594
595 /* Determine the address of the server replying so that we can mark that as good */
596 serveraddr.sa.sa_family = family;
597 #ifdef HAVE_IPV6
598 if (serveraddr.sa.sa_family == AF_INET6)
599 serveraddr.in6.sin6_flowinfo = 0;
600 #endif
601
602 /* spoof check: answer must come from known server, */
603 for (server = daemon->servers; server; server = server->next)
604 if (!(server->flags & (SERV_LITERAL_ADDRESS | SERV_NO_ADDR)) &&
605 sockaddr_isequal(&server->addr, &serveraddr))
606 break;
607
608 header = (struct dns_header *)daemon->packet;
609
610 if (!server ||
611 n < (int)sizeof(struct dns_header) || !(header->hb3 & HB3_QR) ||
612 !(forward = lookup_frec(ntohs(header->id), questions_crc(header, n, daemon->namebuff))))
613 return;
614
615 if ((RCODE(header) == SERVFAIL || RCODE(header) == REFUSED) &&
616 !option_bool(OPT_ORDER) &&
617 forward->forwardall == 0)
618 /* for broken servers, attempt to send to another one. */
619 {
620 unsigned char *pheader;
621 size_t plen;
622 int is_sign;
623
624 /* recreate query from reply */
625 pheader = find_pseudoheader(header, (size_t)n, &plen, NULL, &is_sign);
626 if (!is_sign)
627 {
628 header->ancount = htons(0);
629 header->nscount = htons(0);
630 header->arcount = htons(0);
631 if ((nn = resize_packet(header, (size_t)n, pheader, plen)))
632 {
633 header->hb3 &= ~(HB3_QR | HB3_TC);
634 forward_query(-1, NULL, NULL, 0, header, nn, now, forward);
635 return;
636 }
637 }
638 }
639
640 server = forward->sentto;
641
642 if ((forward->sentto->flags & SERV_TYPE) == 0)
643 {
644 if (RCODE(header) == SERVFAIL || RCODE(header) == REFUSED)
645 server = NULL;
646 else
647 {
648 struct server *last_server;
649
650 /* find good server by address if possible, otherwise assume the last one we sent to */
651 for (last_server = daemon->servers; last_server; last_server = last_server->next)
652 if (!(last_server->flags & (SERV_LITERAL_ADDRESS | SERV_HAS_DOMAIN | SERV_FOR_NODOTS | SERV_NO_ADDR)) &&
653 sockaddr_isequal(&last_server->addr, &serveraddr))
654 {
655 server = last_server;
656 break;
657 }
658 }
659 if (!option_bool(OPT_ALL_SERVERS))
660 daemon->last_server = server;
661 }
662
663 /* If the answer is an error, keep the forward record in place in case
664 we get a good reply from another server. Kill it when we've
665 had replies from all to avoid filling the forwarding table when
666 everything is broken */
667 if (forward->forwardall == 0 || --forward->forwardall == 1 ||
668 (RCODE(header) != REFUSED && RCODE(header) != SERVFAIL))
669 {
670 int check_rebind = 0, no_cache_dnssec = 0, cache_secure = 0;
671
672 if (option_bool(OPT_NO_REBIND))
673 check_rebind = !(forward->flags & FREC_NOREBIND);
674
675 /* Don't cache replies where DNSSEC validation was turned off, either
676 the upstream server told us so, or the original query specified it. */
677 if ((header->hb4 & HB4_CD) || (forward->flags & FREC_CHECKING_DISABLED))
678 no_cache_dnssec = 1;
679
680 #ifdef HAVE_DNSSEC
681 if (option_bool(OPT_DNSSEC_VALID) && !(forward->flags & FREC_CHECKING_DISABLED))
682 {
683 int status;
684
685 /* We've had a reply already, which we're validating. Ignore this duplicate */
686 if (forward->stash)
687 return;
688
689 if (header->hb3 & HB3_TC)
690 {
691 /* Truncated answer can't be validated.
692 The client will retry over TCP, but if this is an answer to a
693 DNSSEC-generated query, we have a problem. Should really re-send
694 over TCP. No-one with any sense will make a DNSKEY or DS RRset
695 exceed 4096, so this may not be a real problem. Just log
696 for now. */
697 if (forward->flags & (FREC_DNSKEY_QUERY | FREC_DS_QUERY))
698 my_syslog(LOG_ERR, _("Reply to DNSSEC query truncated - validation fails."));
699 status = STAT_INSECURE;
700 }
701 else if (forward->flags & FREC_DNSKEY_QUERY)
702 status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
703 else if (forward->flags & FREC_DS_QUERY)
704 status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
705 else
706 status = dnssec_validate_reply(now, header, n, daemon->namebuff, daemon->keyname, &forward->class);
707
708 /* Can't validate, as we're missing key data. Put this
709 answer aside, whilst we get that. */
710 if (status == STAT_NEED_DS || status == STAT_NEED_KEY)
711 {
712 struct frec *new;
713
714 if ((new = get_new_frec(now, NULL, 1)))
715 {
716 struct frec *next = new->next;
717 *new = *forward; /* copy everything, then overwrite */
718 new->next = next;
719 new->stash = NULL;
720 new->blocking_query = NULL;
721 new->flags &= ~(FREC_DNSKEY_QUERY | FREC_DS_QUERY);
722
723 if ((forward->stash = blockdata_alloc((char *)header, n)))
724 {
725 int fd;
726
727 forward->stash_len = n;
728
729 new->dependent = forward; /* to find query awaiting new one. */
730 forward->blocking_query = new; /* for garbage cleaning */
731 /* validate routines leave name of required record in daemon->keyname */
732 if (status == STAT_NEED_KEY)
733 {
734 new->flags |= FREC_DNSKEY_QUERY;
735 nn = dnssec_generate_query(header, ((char *) header) + daemon->packet_buff_sz,
736 daemon->keyname, forward->class, T_DNSKEY, &server->addr);
737 }
738 else if (status == STAT_NEED_DS)
739 {
740 new->flags |= FREC_DS_QUERY;
741 nn = dnssec_generate_query(header,((char *) header) + daemon->packet_buff_sz,
742 daemon->keyname, forward->class, T_DS, &server->addr);
743 }
744 new->crc = questions_crc(header, nn, daemon->namebuff);
745 new->new_id = get_id(new->crc);
746 header->id = htons(new->new_id);
747
748 /* Don't resend this. */
749 daemon->srv_save = NULL;
750
751 if (server->sfd)
752 fd = server->sfd->fd;
753 else
754 #ifdef HAVE_IPV6
755 /* Note that we use the same random port for the DNSSEC stuff */
756 if (server->addr.sa.sa_family == AF_INET6)
757 {
758 fd = new->rfd6->fd;
759 new->rfd6->refcount++;
760 }
761 else
762 #endif
763 {
764 fd = new->rfd4->fd;
765 new->rfd4->refcount++;
766 }
767
768 /* Send DNSSEC query to same server as original query */
769 while (sendto(fd, (char *)header, nn, 0, &server->addr.sa, sa_len(&server->addr)) == -1 && retry_send());
770 server->queries++;
771 }
772 }
773
774 return;
775 }
776
777 /* Ok, we reached far enough up the chain-of-trust that we can validate something.
778 Now wind back down, pulling back answers which wouldn't previously validate
779 and validate them with the new data. Failure to find needed data here is an internal error.
780 Once we get to the original answer (FREC_DNSSEC_QUERY not set) and it validates,
781 return it to the original requestor. */
782 if (forward->flags & (FREC_DNSKEY_QUERY | FREC_DS_QUERY))
783 {
784 while (forward->dependent)
785 {
786 struct frec *prev;
787
788 if (status == STAT_SECURE)
789 {
790 if (forward->flags & FREC_DNSKEY_QUERY)
791 status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
792 else if (forward->flags & FREC_DS_QUERY)
793 status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
794 }
795
796 prev = forward->dependent;
797 free_frec(forward);
798 forward = prev;
799 forward->blocking_query = NULL; /* already gone */
800 blockdata_retrieve(forward->stash, forward->stash_len, (void *)header);
801 n = forward->stash_len;
802 }
803
804 /* All DNSKEY and DS records done and in cache, now finally validate original
805 answer, provided last DNSKEY is OK. */
806 if (status == STAT_SECURE)
807 status = dnssec_validate_reply(now, header, n, daemon->namebuff, daemon->keyname, &forward->class);
808
809 if (status == STAT_NEED_DS || status == STAT_NEED_KEY)
810 {
811 my_syslog(LOG_ERR, _("Unexpected missing data for DNSSEC validation"));
812 status = STAT_INSECURE;
813 }
814 }
815
816 log_query(F_KEYTAG | F_SECSTAT, "result", NULL,
817 status == STAT_SECURE ? "SECURE" : (status == STAT_INSECURE ? "INSECURE" : "BOGUS"));
818
819 no_cache_dnssec = 0;
820
821 if (status == STAT_SECURE)
822 cache_secure = 1;
823 /* TODO return SERVFAIL here */
824 else if (status == STAT_BOGUS)
825 no_cache_dnssec = 1;
826
827 /* restore CD bit to the value in the query */
828 if (forward->flags & FREC_CHECKING_DISABLED)
829 header->hb4 |= HB4_CD;
830 else
831 header->hb4 &= ~HB4_CD;
832 }
833 #endif
834
835 if ((nn = process_reply(header, now, server, (size_t)n, check_rebind, no_cache_dnssec, cache_secure,
836 forward->flags & FREC_HAS_SUBNET, &forward->source)))
837 {
838 header->id = htons(forward->orig_id);
839 header->hb4 |= HB4_RA; /* recursion if available */
840 send_from(forward->fd, option_bool(OPT_NOWILD) || option_bool (OPT_CLEVERBIND), daemon->packet, nn,
841 &forward->source, &forward->dest, forward->iface);
842 }
843 free_frec(forward); /* cancel */
844 }
845 }
846
847
848 void receive_query(struct listener *listen, time_t now)
849 {
850 struct dns_header *header = (struct dns_header *)daemon->packet;
851 union mysockaddr source_addr;
852 unsigned short type;
853 struct all_addr dst_addr;
854 struct in_addr netmask, dst_addr_4;
855 size_t m;
856 ssize_t n;
857 int if_index = 0, auth_dns = 0;
858 #ifdef HAVE_AUTH
859 int local_auth = 0;
860 #endif
861 struct iovec iov[1];
862 struct msghdr msg;
863 struct cmsghdr *cmptr;
864 union {
865 struct cmsghdr align; /* this ensures alignment */
866 #ifdef HAVE_IPV6
867 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
868 #endif
869 #if defined(HAVE_LINUX_NETWORK)
870 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
871 #elif defined(IP_RECVDSTADDR) && defined(HAVE_SOLARIS_NETWORK)
872 char control[CMSG_SPACE(sizeof(struct in_addr)) +
873 CMSG_SPACE(sizeof(unsigned int))];
874 #elif defined(IP_RECVDSTADDR)
875 char control[CMSG_SPACE(sizeof(struct in_addr)) +
876 CMSG_SPACE(sizeof(struct sockaddr_dl))];
877 #endif
878 } control_u;
879 #ifdef HAVE_IPV6
880 /* Can always get recvd interface for IPv6 */
881 int check_dst = !option_bool(OPT_NOWILD) || listen->family == AF_INET6;
882 #else
883 int check_dst = !option_bool(OPT_NOWILD);
884 #endif
885
886 /* packet buffer overwritten */
887 daemon->srv_save = NULL;
888
889 dst_addr_4.s_addr = 0;
890 netmask.s_addr = 0;
891
892 if (option_bool(OPT_NOWILD) && listen->iface)
893 {
894 auth_dns = listen->iface->dns_auth;
895
896 if (listen->family == AF_INET)
897 {
898 dst_addr_4 = listen->iface->addr.in.sin_addr;
899 netmask = listen->iface->netmask;
900 }
901 }
902
903 iov[0].iov_base = daemon->packet;
904 iov[0].iov_len = daemon->edns_pktsz;
905
906 msg.msg_control = control_u.control;
907 msg.msg_controllen = sizeof(control_u);
908 msg.msg_flags = 0;
909 msg.msg_name = &source_addr;
910 msg.msg_namelen = sizeof(source_addr);
911 msg.msg_iov = iov;
912 msg.msg_iovlen = 1;
913
914 if ((n = recvmsg(listen->fd, &msg, 0)) == -1)
915 return;
916
917 if (n < (int)sizeof(struct dns_header) ||
918 (msg.msg_flags & MSG_TRUNC) ||
919 (header->hb3 & HB3_QR))
920 return;
921
922 source_addr.sa.sa_family = listen->family;
923 #ifdef HAVE_IPV6
924 if (listen->family == AF_INET6)
925 source_addr.in6.sin6_flowinfo = 0;
926 #endif
927
928 if (check_dst)
929 {
930 struct ifreq ifr;
931
932 if (msg.msg_controllen < sizeof(struct cmsghdr))
933 return;
934
935 #if defined(HAVE_LINUX_NETWORK)
936 if (listen->family == AF_INET)
937 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
938 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_PKTINFO)
939 {
940 union {
941 unsigned char *c;
942 struct in_pktinfo *p;
943 } p;
944 p.c = CMSG_DATA(cmptr);
945 dst_addr_4 = dst_addr.addr.addr4 = p.p->ipi_spec_dst;
946 if_index = p.p->ipi_ifindex;
947 }
948 #elif defined(IP_RECVDSTADDR) && defined(IP_RECVIF)
949 if (listen->family == AF_INET)
950 {
951 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
952 {
953 union {
954 unsigned char *c;
955 unsigned int *i;
956 struct in_addr *a;
957 #ifndef HAVE_SOLARIS_NETWORK
958 struct sockaddr_dl *s;
959 #endif
960 } p;
961 p.c = CMSG_DATA(cmptr);
962 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVDSTADDR)
963 dst_addr_4 = dst_addr.addr.addr4 = *(p.a);
964 else if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVIF)
965 #ifdef HAVE_SOLARIS_NETWORK
966 if_index = *(p.i);
967 #else
968 if_index = p.s->sdl_index;
969 #endif
970 }
971 }
972 #endif
973
974 #ifdef HAVE_IPV6
975 if (listen->family == AF_INET6)
976 {
977 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
978 if (cmptr->cmsg_level == IPPROTO_IPV6 && cmptr->cmsg_type == daemon->v6pktinfo)
979 {
980 union {
981 unsigned char *c;
982 struct in6_pktinfo *p;
983 } p;
984 p.c = CMSG_DATA(cmptr);
985
986 dst_addr.addr.addr6 = p.p->ipi6_addr;
987 if_index = p.p->ipi6_ifindex;
988 }
989 }
990 #endif
991
992 /* enforce available interface configuration */
993
994 if (!indextoname(listen->fd, if_index, ifr.ifr_name))
995 return;
996
997 if (!iface_check(listen->family, &dst_addr, ifr.ifr_name, &auth_dns))
998 {
999 if (!option_bool(OPT_CLEVERBIND))
1000 enumerate_interfaces(0);
1001 if (!loopback_exception(listen->fd, listen->family, &dst_addr, ifr.ifr_name) &&
1002 !label_exception(if_index, listen->family, &dst_addr))
1003 return;
1004 }
1005
1006 if (listen->family == AF_INET && option_bool(OPT_LOCALISE))
1007 {
1008 struct irec *iface;
1009
1010 /* get the netmask of the interface whch has the address we were sent to.
1011 This is no neccessarily the interface we arrived on. */
1012
1013 for (iface = daemon->interfaces; iface; iface = iface->next)
1014 if (iface->addr.sa.sa_family == AF_INET &&
1015 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
1016 break;
1017
1018 /* interface may be new */
1019 if (!iface && !option_bool(OPT_CLEVERBIND))
1020 enumerate_interfaces(0);
1021
1022 for (iface = daemon->interfaces; iface; iface = iface->next)
1023 if (iface->addr.sa.sa_family == AF_INET &&
1024 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
1025 break;
1026
1027 /* If we failed, abandon localisation */
1028 if (iface)
1029 netmask = iface->netmask;
1030 else
1031 dst_addr_4.s_addr = 0;
1032 }
1033 }
1034
1035 if (extract_request(header, (size_t)n, daemon->namebuff, &type))
1036 {
1037 char types[20];
1038 #ifdef HAVE_AUTH
1039 struct auth_zone *zone;
1040 #endif
1041
1042 querystr(auth_dns ? "auth" : "query", types, type);
1043
1044 if (listen->family == AF_INET)
1045 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1046 (struct all_addr *)&source_addr.in.sin_addr, types);
1047 #ifdef HAVE_IPV6
1048 else
1049 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1050 (struct all_addr *)&source_addr.in6.sin6_addr, types);
1051 #endif
1052
1053 #ifdef HAVE_AUTH
1054 /* find queries for zones we're authoritative for, and answer them directly */
1055 if (!auth_dns)
1056 for (zone = daemon->auth_zones; zone; zone = zone->next)
1057 if (in_zone(zone, daemon->namebuff, NULL))
1058 {
1059 auth_dns = 1;
1060 local_auth = 1;
1061 break;
1062 }
1063 #endif
1064 }
1065
1066 #ifdef HAVE_AUTH
1067 if (auth_dns)
1068 {
1069 m = answer_auth(header, ((char *) header) + daemon->packet_buff_sz, (size_t)n, now, &source_addr, local_auth);
1070 if (m >= 1)
1071 {
1072 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
1073 (char *)header, m, &source_addr, &dst_addr, if_index);
1074 daemon->auth_answer++;
1075 }
1076 }
1077 else
1078 #endif
1079 {
1080 m = answer_request(header, ((char *) header) + daemon->packet_buff_sz, (size_t)n,
1081 dst_addr_4, netmask, now);
1082
1083 if (m >= 1)
1084 {
1085 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
1086 (char *)header, m, &source_addr, &dst_addr, if_index);
1087 daemon->local_answer++;
1088 }
1089 else if (forward_query(listen->fd, &source_addr, &dst_addr, if_index,
1090 header, (size_t)n, now, NULL))
1091 daemon->queries_forwarded++;
1092 else
1093 daemon->local_answer++;
1094 }
1095 }
1096
#ifdef HAVE_DNSSEC
/* Fetch and validate, over the TCP connection already open to "server",
   the key material needed to continue a DNSSEC validation.

   status selects what is asked for: STAT_NEED_KEY sends a DNSKEY query,
   any other value sends a DS query, for keyname in the given class.
   If validating that answer in turn reports STAT_NEED_DS or STAT_NEED_KEY,
   recurse up the key hierarchy and, when that comes back STAT_SECURE,
   retry the validation once.

   Returns the resulting validation status. STAT_INSECURE is returned when
   the packet buffer cannot be allocated, when talking to the server fails
   (the connection is then closed and server->tcpfd set to -1), or when the
   retry still reports missing data. */
static int tcp_key_recurse(time_t now, int status, int class, char *keyname, struct server *server)
{
  size_t n;
  /* Max TCP packet + slop + two-byte length prefix */
  unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
  unsigned char *payload;
  struct dns_header *header;
  u16 *length;
  int new_status;
  unsigned char c1, c2;

  /* Cannot validate anything without a buffer. */
  if (!packet)
    return STAT_INSECURE;

  payload = &packet[2];
  header = (struct dns_header *)payload;
  length = (u16 *)packet;

  n = dnssec_generate_query(header, ((char *) header) + 65536, keyname, class,
                            status == STAT_NEED_KEY ? T_DNSKEY : T_DS, &server->addr);

  *length = htons(n);

  /* Send length-prefixed query, then read the two length bytes and the reply. */
  if (!read_write(server->tcpfd, packet, n + sizeof(u16), 0) ||
      !read_write(server->tcpfd, &c1, 1, 1) ||
      !read_write(server->tcpfd, &c2, 1, 1) ||
      !read_write(server->tcpfd, payload, (c1 << 8) | c2, 1))
    {
      close(server->tcpfd);
      server->tcpfd = -1;
      new_status = STAT_INSECURE;
    }
  else
    {
      n = (c1 << 8) | c2;

      if (status == STAT_NEED_KEY)
        new_status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, class);
      else
        new_status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, class);

      if (new_status == STAT_NEED_DS || new_status == STAT_NEED_KEY)
        {
          /* Keep the real status of the recursive lookup, not the result
             of comparing it with STAT_SECURE. */
          new_status = tcp_key_recurse(now, new_status, class, daemon->keyname, server);

          if (new_status == STAT_SECURE)
            {
              /* The missing data should be available now: validate again. */
              if (status == STAT_NEED_KEY)
                new_status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, class);
              else
                new_status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, class);

              if (new_status == STAT_NEED_DS || new_status == STAT_NEED_KEY)
                {
                  my_syslog(LOG_ERR, _("Unexpected missing data for DNSSEC validation"));
                  new_status = STAT_INSECURE;
                }
            }
        }
    }

  free(packet);

  return new_status;
}
#endif
1155
1156
1157 /* The daemon forks before calling this: it should deal with one connection,
1158 blocking as neccessary, and then return. Note, need to be a bit careful
1159 about resources for debug mode, when the fork is suppressed: that's
1160 done by the caller. */
1161 unsigned char *tcp_request(int confd, time_t now,
1162 union mysockaddr *local_addr, struct in_addr netmask, int auth_dns)
1163 {
1164 size_t size = 0;
1165 int norebind = 0;
1166 #ifdef HAVE_AUTH
1167 int local_auth = 0;
1168 #endif
1169 int checking_disabled, check_subnet, no_cache_dnssec = 0, cache_secure = 0;
1170 size_t m;
1171 unsigned short qtype;
1172 unsigned int gotname;
1173 unsigned char c1, c2;
1174 /* Max TCP packet + slop + size */
1175 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
1176 unsigned char *payload = &packet[2];
1177 /* largest field in header is 16-bits, so this is still sufficiently aligned */
1178 struct dns_header *header = (struct dns_header *)payload;
1179 u16 *length = (u16 *)packet;
1180 struct server *last_server;
1181 struct in_addr dst_addr_4;
1182 union mysockaddr peer_addr;
1183 socklen_t peer_len = sizeof(union mysockaddr);
1184
1185 if (getpeername(confd, (struct sockaddr *)&peer_addr, &peer_len) == -1)
1186 return packet;
1187
1188 while (1)
1189 {
1190 if (!packet ||
1191 !read_write(confd, &c1, 1, 1) || !read_write(confd, &c2, 1, 1) ||
1192 !(size = c1 << 8 | c2) ||
1193 !read_write(confd, payload, size, 1))
1194 return packet;
1195
1196 if (size < (int)sizeof(struct dns_header))
1197 continue;
1198
1199 check_subnet = 0;
1200
1201 /* save state of "cd" flag in query */
1202 if ((checking_disabled = header->hb4 & HB4_CD))
1203 no_cache_dnssec = 1;
1204
1205 /* RFC 4035: sect 4.6 para 2 */
1206 header->hb4 &= ~HB4_AD;
1207
1208 if ((gotname = extract_request(header, (unsigned int)size, daemon->namebuff, &qtype)))
1209 {
1210 char types[20];
1211 #ifdef HAVE_AUTH
1212 struct auth_zone *zone;
1213 #endif
1214 querystr(auth_dns ? "auth" : "query", types, qtype);
1215
1216 if (peer_addr.sa.sa_family == AF_INET)
1217 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1218 (struct all_addr *)&peer_addr.in.sin_addr, types);
1219 #ifdef HAVE_IPV6
1220 else
1221 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1222 (struct all_addr *)&peer_addr.in6.sin6_addr, types);
1223 #endif
1224
1225 #ifdef HAVE_AUTH
1226 /* find queries for zones we're authoritative for, and answer them directly */
1227 if (!auth_dns)
1228 for (zone = daemon->auth_zones; zone; zone = zone->next)
1229 if (in_zone(zone, daemon->namebuff, NULL))
1230 {
1231 auth_dns = 1;
1232 local_auth = 1;
1233 break;
1234 }
1235 #endif
1236 }
1237
1238 if (local_addr->sa.sa_family == AF_INET)
1239 dst_addr_4 = local_addr->in.sin_addr;
1240 else
1241 dst_addr_4.s_addr = 0;
1242
1243 #ifdef HAVE_AUTH
1244 if (auth_dns)
1245 m = answer_auth(header, ((char *) header) + 65536, (size_t)size, now, &peer_addr, local_auth);
1246 else
1247 #endif
1248 {
1249 /* m > 0 if answered from cache */
1250 m = answer_request(header, ((char *) header) + 65536, (size_t)size,
1251 dst_addr_4, netmask, now);
1252
1253 /* Do this by steam now we're not in the select() loop */
1254 check_log_writer(NULL);
1255
1256 if (m == 0)
1257 {
1258 unsigned int flags = 0;
1259 struct all_addr *addrp = NULL;
1260 int type = 0;
1261 char *domain = NULL;
1262
1263 if (option_bool(OPT_ADD_MAC))
1264 size = add_mac(header, size, ((char *) header) + 65536, &peer_addr);
1265
1266 if (option_bool(OPT_CLIENT_SUBNET))
1267 {
1268 size_t new = add_source_addr(header, size, ((char *) header) + 65536, &peer_addr);
1269 if (size != new)
1270 {
1271 size = new;
1272 check_subnet = 1;
1273 }
1274 }
1275
1276 if (gotname)
1277 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
1278
1279 if (type != 0 || option_bool(OPT_ORDER) || !daemon->last_server)
1280 last_server = daemon->servers;
1281 else
1282 last_server = daemon->last_server;
1283
1284 if (!flags && last_server)
1285 {
1286 struct server *firstsendto = NULL;
1287 unsigned int crc = questions_crc(header, (unsigned int)size, daemon->namebuff);
1288
1289 /* Loop round available servers until we succeed in connecting to one.
1290 Note that this code subtley ensures that consecutive queries on this connection
1291 which can go to the same server, do so. */
1292 while (1)
1293 {
1294 if (!firstsendto)
1295 firstsendto = last_server;
1296 else
1297 {
1298 if (!(last_server = last_server->next))
1299 last_server = daemon->servers;
1300
1301 if (last_server == firstsendto)
1302 break;
1303 }
1304
1305 /* server for wrong domain */
1306 if (type != (last_server->flags & SERV_TYPE) ||
1307 (type == SERV_HAS_DOMAIN && !hostname_isequal(domain, last_server->domain)))
1308 continue;
1309
1310 if (last_server->tcpfd == -1)
1311 {
1312 if ((last_server->tcpfd = socket(last_server->addr.sa.sa_family, SOCK_STREAM, 0)) == -1)
1313 continue;
1314
1315 if ((!local_bind(last_server->tcpfd, &last_server->source_addr, last_server->interface, 1) ||
1316 connect(last_server->tcpfd, &last_server->addr.sa, sa_len(&last_server->addr)) == -1))
1317 {
1318 close(last_server->tcpfd);
1319 last_server->tcpfd = -1;
1320 continue;
1321 }
1322
1323 #ifdef HAVE_DNSSEC
1324 if (option_bool(OPT_DNSSEC_VALID))
1325 {
1326 size = add_do_bit(header, size, ((char *) header) + 65536);
1327 header->hb4 |= HB4_CD;
1328 }
1329 #endif
1330
1331 #ifdef HAVE_CONNTRACK
1332 /* Copy connection mark of incoming query to outgoing connection. */
1333 if (option_bool(OPT_CONNTRACK))
1334 {
1335 unsigned int mark;
1336 struct all_addr local;
1337 #ifdef HAVE_IPV6
1338 if (local_addr->sa.sa_family == AF_INET6)
1339 local.addr.addr6 = local_addr->in6.sin6_addr;
1340 else
1341 #endif
1342 local.addr.addr4 = local_addr->in.sin_addr;
1343
1344 if (get_incoming_mark(&peer_addr, &local, 1, &mark))
1345 setsockopt(last_server->tcpfd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
1346 }
1347 #endif
1348 }
1349
1350 *length = htons(size);
1351
1352 if (!read_write(last_server->tcpfd, packet, size + sizeof(u16), 0) ||
1353 !read_write(last_server->tcpfd, &c1, 1, 1) ||
1354 !read_write(last_server->tcpfd, &c2, 1, 1) ||
1355 !read_write(last_server->tcpfd, payload, (c1 << 8) | c2, 1))
1356 {
1357 close(last_server->tcpfd);
1358 last_server->tcpfd = -1;
1359 continue;
1360 }
1361
1362 m = (c1 << 8) | c2;
1363
1364 if (!gotname)
1365 strcpy(daemon->namebuff, "query");
1366 if (last_server->addr.sa.sa_family == AF_INET)
1367 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1368 (struct all_addr *)&last_server->addr.in.sin_addr, NULL);
1369 #ifdef HAVE_IPV6
1370 else
1371 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1372 (struct all_addr *)&last_server->addr.in6.sin6_addr, NULL);
1373 #endif
1374
1375 #ifdef HAVE_DNSSEC
1376 if (option_bool(OPT_DNSSEC_VALID) && !checking_disabled)
1377 {
1378 int class, status;
1379
1380 status = dnssec_validate_reply(now, header, m, daemon->namebuff, daemon->keyname, &class);
1381
1382 if (status == STAT_NEED_DS || status == STAT_NEED_KEY)
1383 {
1384 if ((status = tcp_key_recurse(now, status, class, daemon->keyname, last_server)) == STAT_SECURE)
1385 status = dnssec_validate_reply(now, header, m, daemon->namebuff, daemon->keyname, &class);
1386 }
1387
1388 log_query(F_KEYTAG | F_SECSTAT, "result", NULL,
1389 status == STAT_SECURE ? "SECURE" : (status == STAT_INSECURE ? "INSECURE" : "BOGUS"));
1390
1391 if (status == STAT_BOGUS)
1392 no_cache_dnssec = 1;
1393
1394 if (status == STAT_SECURE)
1395 cache_secure = 1;
1396 }
1397 #endif
1398
1399 /* restore CD bit to the value in the query */
1400 if (checking_disabled)
1401 header->hb4 |= HB4_CD;
1402 else
1403 header->hb4 &= ~HB4_CD;
1404
1405 /* There's no point in updating the cache, since this process will exit and
1406 lose the information after a few queries. We make this call for the alias and
1407 bogus-nxdomain side-effects. */
1408 /* If the crc of the question section doesn't match the crc we sent, then
1409 someone might be attempting to insert bogus values into the cache by
1410 sending replies containing questions and bogus answers. */
1411 if (crc == questions_crc(header, (unsigned int)m, daemon->namebuff))
1412 m = process_reply(header, now, last_server, (unsigned int)m,
1413 option_bool(OPT_NO_REBIND) && !norebind, no_cache_dnssec,
1414 cache_secure, check_subnet, &peer_addr);
1415
1416 break;
1417 }
1418 }
1419
1420 /* In case of local answer or no connections made. */
1421 if (m == 0)
1422 m = setup_reply(header, (unsigned int)size, addrp, flags, daemon->local_ttl);
1423 }
1424 }
1425
1426 check_log_writer(NULL);
1427
1428 *length = htons(m);
1429
1430 if (m == 0 || !read_write(confd, packet, m + sizeof(u16), 0))
1431 return packet;
1432 }
1433 }
1434
1435 static struct frec *allocate_frec(time_t now)
1436 {
1437 struct frec *f;
1438
1439 if ((f = (struct frec *)whine_malloc(sizeof(struct frec))))
1440 {
1441 f->next = daemon->frec_list;
1442 f->time = now;
1443 f->sentto = NULL;
1444 f->rfd4 = NULL;
1445 f->flags = 0;
1446 #ifdef HAVE_IPV6
1447 f->rfd6 = NULL;
1448 #endif
1449 #ifdef HAVE_DNSSEC
1450 f->blocking_query = NULL;
1451 #endif
1452 daemon->frec_list = f;
1453 }
1454
1455 return f;
1456 }
1457
1458 static struct randfd *allocate_rfd(int family)
1459 {
1460 static int finger = 0;
1461 int i;
1462
1463 /* limit the number of sockets we have open to avoid starvation of
1464 (eg) TFTP. Once we have a reasonable number, randomness should be OK */
1465
1466 for (i = 0; i < RANDOM_SOCKS; i++)
1467 if (daemon->randomsocks[i].refcount == 0)
1468 {
1469 if ((daemon->randomsocks[i].fd = random_sock(family)) == -1)
1470 break;
1471
1472 daemon->randomsocks[i].refcount = 1;
1473 daemon->randomsocks[i].family = family;
1474 return &daemon->randomsocks[i];
1475 }
1476
1477 /* No free ones or cannot get new socket, grab an existing one */
1478 for (i = 0; i < RANDOM_SOCKS; i++)
1479 {
1480 int j = (i+finger) % RANDOM_SOCKS;
1481 if (daemon->randomsocks[j].refcount != 0 &&
1482 daemon->randomsocks[j].family == family &&
1483 daemon->randomsocks[j].refcount != 0xffff)
1484 {
1485 finger = j;
1486 daemon->randomsocks[j].refcount++;
1487 return &daemon->randomsocks[j];
1488 }
1489 }
1490
1491 return NULL; /* doom */
1492 }
1493 static void free_frec(struct frec *f)
1494 {
1495 if (f->rfd4 && --(f->rfd4->refcount) == 0)
1496 close(f->rfd4->fd);
1497
1498 f->rfd4 = NULL;
1499 f->sentto = NULL;
1500 f->flags = 0;
1501
1502 #ifdef HAVE_IPV6
1503 if (f->rfd6 && --(f->rfd6->refcount) == 0)
1504 close(f->rfd6->fd);
1505
1506 f->rfd6 = NULL;
1507 #endif
1508
1509 #ifdef HAVE_DNSSEC
1510 if (f->stash)
1511 {
1512 blockdata_free(f->stash);
1513 f->stash = NULL;
1514 }
1515
1516 /* Anything we're waiting on is pointless now, too */
1517 if (f->blocking_query)
1518 free_frec(f->blocking_query);
1519 f->blocking_query = NULL;
1520
1521 #endif
1522 }
1523
1524 /* if wait==NULL return a free or older than TIMEOUT record.
1525 else return *wait zero if one available, or *wait is delay to
1526 when the oldest in-use record will expire. Impose an absolute
1527 limit of 4*TIMEOUT before we wipe things (for random sockets).
1528 If force is set, always return a result, even if we have
1529 to allocate above the limit. */
1530 struct frec *get_new_frec(time_t now, int *wait, int force)
1531 {
1532 struct frec *f, *oldest, *target;
1533 int count;
1534
1535 if (wait)
1536 *wait = 0;
1537
1538 for (f = daemon->frec_list, oldest = NULL, target = NULL, count = 0; f; f = f->next, count++)
1539 if (!f->sentto)
1540 target = f;
1541 else
1542 {
1543 if (difftime(now, f->time) >= 4*TIMEOUT)
1544 {
1545 free_frec(f);
1546 target = f;
1547 }
1548
1549 if (!oldest || difftime(f->time, oldest->time) <= 0)
1550 oldest = f;
1551 }
1552
1553 if (target)
1554 {
1555 target->time = now;
1556 return target;
1557 }
1558
1559 /* can't find empty one, use oldest if there is one
1560 and it's older than timeout */
1561 if (oldest && ((int)difftime(now, oldest->time)) >= TIMEOUT)
1562 {
1563 /* keep stuff for twice timeout if we can by allocating a new
1564 record instead */
1565 if (difftime(now, oldest->time) < 2*TIMEOUT &&
1566 count <= daemon->ftabsize &&
1567 (f = allocate_frec(now)))
1568 return f;
1569
1570 if (!wait)
1571 {
1572 free_frec(oldest);
1573 oldest->time = now;
1574 }
1575 return oldest;
1576 }
1577
1578 /* none available, calculate time 'till oldest record expires */
1579 if (!force && count > daemon->ftabsize)
1580 {
1581 static time_t last_log = 0;
1582
1583 if (oldest && wait)
1584 *wait = oldest->time + (time_t)TIMEOUT - now;
1585
1586 if ((int)difftime(now, last_log) > 5)
1587 {
1588 last_log = now;
1589 my_syslog(LOG_WARNING, _("Maximum number of concurrent DNS queries reached (max: %d)"), daemon->ftabsize);
1590 }
1591
1592 return NULL;
1593 }
1594
1595 if (!(f = allocate_frec(now)) && wait)
1596 /* wait one second on malloc failure */
1597 *wait = 1;
1598
1599 return f; /* OK if malloc fails and this is NULL */
1600 }
1601
1602 /* crc is all-ones if not known. */
1603 static struct frec *lookup_frec(unsigned short id, unsigned int crc)
1604 {
1605 struct frec *f;
1606
1607 for(f = daemon->frec_list; f; f = f->next)
1608 if (f->sentto && f->new_id == id &&
1609 (f->crc == crc || crc == 0xffffffff))
1610 return f;
1611
1612 return NULL;
1613 }
1614
1615 static struct frec *lookup_frec_by_sender(unsigned short id,
1616 union mysockaddr *addr,
1617 unsigned int crc)
1618 {
1619 struct frec *f;
1620
1621 for(f = daemon->frec_list; f; f = f->next)
1622 if (f->sentto &&
1623 f->orig_id == id &&
1624 f->crc == crc &&
1625 sockaddr_isequal(&f->source, addr))
1626 return f;
1627
1628 return NULL;
1629 }
1630
1631 /* A server record is going away, remove references to it */
1632 void server_gone(struct server *server)
1633 {
1634 struct frec *f;
1635
1636 for (f = daemon->frec_list; f; f = f->next)
1637 if (f->sentto && f->sentto == server)
1638 free_frec(f);
1639
1640 if (daemon->last_server == server)
1641 daemon->last_server = NULL;
1642
1643 if (daemon->srv_save == server)
1644 daemon->srv_save = NULL;
1645 }
1646
/* Return a random 16-bit id that lookup_frec() does not find
   in use for the given question crc. */
static unsigned short get_id(unsigned int crc)
{
  unsigned short candidate;

  for (;;)
    {
      candidate = rand16();

      if (!lookup_frec(candidate, crc))
        return candidate;
    }
}
1658
1659
1660
1661
1662