]> git.ipfire.org Git - people/ms/dnsmasq.git/blob - src/forward.c
Terminate DS-search when reaching the root via cache entries.
[people/ms/dnsmasq.git] / src / forward.c
1 /* dnsmasq is Copyright (c) 2000-2014 Simon Kelley
2
3 This program is free software; you can redistribute it and/or modify
4 it under the terms of the GNU General Public License as published by
5 the Free Software Foundation; version 2 dated June, 1991, or
6 (at your option) version 3 dated 29 June, 2007.
7
8 This program is distributed in the hope that it will be useful,
9 but WITHOUT ANY WARRANTY; without even the implied warranty of
10 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 GNU General Public License for more details.
12
13 You should have received a copy of the GNU General Public License
14 along with this program. If not, see <http://www.gnu.org/licenses/>.
15 */
16
17 #include "dnsmasq.h"
18
19 static struct frec *lookup_frec(unsigned short id, void *hash);
20 static struct frec *lookup_frec_by_sender(unsigned short id,
21 union mysockaddr *addr,
22 void *hash);
23 static unsigned short get_id(void);
24 static void free_frec(struct frec *f);
25 static struct randfd *allocate_rfd(int family);
26
27 #ifdef HAVE_DNSSEC
28 static int tcp_key_recurse(time_t now, int status, struct dns_header *header, size_t n,
29 int class, char *name, char *keyname, struct server *server, int *keycount);
30 static int do_check_sign(time_t now, struct dns_header *header, size_t plen, char *name, char *keyname, int class);
31 static int send_check_sign(time_t now, struct dns_header *header, size_t plen, char *name, char *keyname);
32 #endif
33
34
35 /* Send a UDP packet with its source address set as "source"
36 unless nowild is true, when we just send it with the kernel default */
37 int send_from(int fd, int nowild, char *packet, size_t len,
38 union mysockaddr *to, struct all_addr *source,
39 unsigned int iface)
40 {
41 struct msghdr msg;
42 struct iovec iov[1];
43 union {
44 struct cmsghdr align; /* this ensures alignment */
45 #if defined(HAVE_LINUX_NETWORK)
46 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
47 #elif defined(IP_SENDSRCADDR)
48 char control[CMSG_SPACE(sizeof(struct in_addr))];
49 #endif
50 #ifdef HAVE_IPV6
51 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
52 #endif
53 } control_u;
54
55 iov[0].iov_base = packet;
56 iov[0].iov_len = len;
57
58 msg.msg_control = NULL;
59 msg.msg_controllen = 0;
60 msg.msg_flags = 0;
61 msg.msg_name = to;
62 msg.msg_namelen = sa_len(to);
63 msg.msg_iov = iov;
64 msg.msg_iovlen = 1;
65
66 if (!nowild)
67 {
68 struct cmsghdr *cmptr;
69 msg.msg_control = &control_u;
70 msg.msg_controllen = sizeof(control_u);
71 cmptr = CMSG_FIRSTHDR(&msg);
72
73 if (to->sa.sa_family == AF_INET)
74 {
75 #if defined(HAVE_LINUX_NETWORK)
76 struct in_pktinfo p;
77 p.ipi_ifindex = 0;
78 p.ipi_spec_dst = source->addr.addr4;
79 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
80 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_pktinfo));
81 cmptr->cmsg_level = IPPROTO_IP;
82 cmptr->cmsg_type = IP_PKTINFO;
83 #elif defined(IP_SENDSRCADDR)
84 memcpy(CMSG_DATA(cmptr), &(source->addr.addr4), sizeof(source->addr.addr4));
85 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_addr));
86 cmptr->cmsg_level = IPPROTO_IP;
87 cmptr->cmsg_type = IP_SENDSRCADDR;
88 #endif
89 }
90 else
91 #ifdef HAVE_IPV6
92 {
93 struct in6_pktinfo p;
94 p.ipi6_ifindex = iface; /* Need iface for IPv6 to handle link-local addrs */
95 p.ipi6_addr = source->addr.addr6;
96 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
97 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
98 cmptr->cmsg_type = daemon->v6pktinfo;
99 cmptr->cmsg_level = IPPROTO_IPV6;
100 }
101 #else
102 (void)iface; /* eliminate warning */
103 #endif
104 }
105
106 while (sendmsg(fd, &msg, 0) == -1)
107 {
108 if (retry_send())
109 continue;
110
111 /* If interface is still in DAD, EINVAL results - ignore that. */
112 if (errno == EINVAL)
113 break;
114
115 my_syslog(LOG_ERR, _("failed to send packet: %s"), strerror(errno));
116 return 0;
117 }
118
119 return 1;
120 }
121
122 static unsigned int search_servers(time_t now, struct all_addr **addrpp,
123 unsigned int qtype, char *qdomain, int *type, char **domain, int *norebind)
124
125 {
126 /* If the query ends in the domain in one of our servers, set
127 domain to point to that name. We find the largest match to allow both
128 domain.org and sub.domain.org to exist. */
129
130 unsigned int namelen = strlen(qdomain);
131 unsigned int matchlen = 0;
132 struct server *serv;
133 unsigned int flags = 0;
134
135 for (serv = daemon->servers; serv; serv=serv->next)
136 /* domain matches take priority over NODOTS matches */
137 if ((serv->flags & SERV_FOR_NODOTS) && *type != SERV_HAS_DOMAIN && !strchr(qdomain, '.') && namelen != 0)
138 {
139 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
140 *type = SERV_FOR_NODOTS;
141 if (serv->flags & SERV_NO_ADDR)
142 flags = F_NXDOMAIN;
143 else if (serv->flags & SERV_LITERAL_ADDRESS)
144 {
145 if (sflag & qtype)
146 {
147 flags = sflag;
148 if (serv->addr.sa.sa_family == AF_INET)
149 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
150 #ifdef HAVE_IPV6
151 else
152 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
153 #endif
154 }
155 else if (!flags || (flags & F_NXDOMAIN))
156 flags = F_NOERR;
157 }
158 }
159 else if (serv->flags & SERV_HAS_DOMAIN)
160 {
161 unsigned int domainlen = strlen(serv->domain);
162 char *matchstart = qdomain + namelen - domainlen;
163 if (namelen >= domainlen &&
164 hostname_isequal(matchstart, serv->domain) &&
165 (domainlen == 0 || namelen == domainlen || *(matchstart-1) == '.' ))
166 {
167 if (serv->flags & SERV_NO_REBIND)
168 *norebind = 1;
169 else
170 {
171 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
172 /* implement priority rules for --address and --server for same domain.
173 --address wins if the address is for the correct AF
174 --server wins otherwise. */
175 if (domainlen != 0 && domainlen == matchlen)
176 {
177 if ((serv->flags & SERV_LITERAL_ADDRESS))
178 {
179 if (!(sflag & qtype) && flags == 0)
180 continue;
181 }
182 else
183 {
184 if (flags & (F_IPV4 | F_IPV6))
185 continue;
186 }
187 }
188
189 if (domainlen >= matchlen)
190 {
191 *type = serv->flags & (SERV_HAS_DOMAIN | SERV_USE_RESOLV | SERV_NO_REBIND);
192 *domain = serv->domain;
193 matchlen = domainlen;
194 if (serv->flags & SERV_NO_ADDR)
195 flags = F_NXDOMAIN;
196 else if (serv->flags & SERV_LITERAL_ADDRESS)
197 {
198 if (sflag & qtype)
199 {
200 flags = sflag;
201 if (serv->addr.sa.sa_family == AF_INET)
202 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
203 #ifdef HAVE_IPV6
204 else
205 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
206 #endif
207 }
208 else if (!flags || (flags & F_NXDOMAIN))
209 flags = F_NOERR;
210 }
211 else
212 flags = 0;
213 }
214 }
215 }
216 }
217
218 if (flags == 0 && !(qtype & F_QUERY) &&
219 option_bool(OPT_NODOTS_LOCAL) && !strchr(qdomain, '.') && namelen != 0)
220 /* don't forward A or AAAA queries for simple names, except the empty name */
221 flags = F_NOERR;
222
223 if (flags == F_NXDOMAIN && check_for_local_domain(qdomain, now))
224 flags = F_NOERR;
225
226 if (flags)
227 {
228 int logflags = 0;
229
230 if (flags == F_NXDOMAIN || flags == F_NOERR)
231 logflags = F_NEG | qtype;
232
233 log_query(logflags | flags | F_CONFIG | F_FORWARD, qdomain, *addrpp, NULL);
234 }
235 else if ((*type) & SERV_USE_RESOLV)
236 {
237 *type = 0; /* use normal servers for this domain */
238 *domain = NULL;
239 }
240 return flags;
241 }
242
243 static int forward_query(int udpfd, union mysockaddr *udpaddr,
244 struct all_addr *dst_addr, unsigned int dst_iface,
245 struct dns_header *header, size_t plen, time_t now,
246 struct frec *forward, int ad_reqd, int do_bit)
247 {
248 char *domain = NULL;
249 int type = 0, norebind = 0;
250 struct all_addr *addrp = NULL;
251 unsigned int flags = 0;
252 struct server *start = NULL;
253 #ifdef HAVE_DNSSEC
254 void *hash = hash_questions(header, plen, daemon->namebuff);
255 #else
256 unsigned int crc = questions_crc(header, plen, daemon->namebuff);
257 void *hash = &crc;
258 #endif
259 unsigned int gotname = extract_request(header, plen, daemon->namebuff, NULL);
260
261 (void)do_bit;
262
263 /* may be no servers available. */
264 if (!daemon->servers)
265 forward = NULL;
266 else if (forward || (hash && (forward = lookup_frec_by_sender(ntohs(header->id), udpaddr, hash))))
267 {
268 #ifdef HAVE_DNSSEC
269 /* If we've already got an answer to this query, but we're awaiting keys for validation,
270 there's no point retrying the query, retry the key query instead...... */
271 if (forward->blocking_query)
272 {
273 int fd;
274
275 while (forward->blocking_query)
276 forward = forward->blocking_query;
277
278 blockdata_retrieve(forward->stash, forward->stash_len, (void *)header);
279 plen = forward->stash_len;
280
281 if (forward->sentto->addr.sa.sa_family == AF_INET)
282 log_query(F_DNSSEC | F_IPV4, "retry", (struct all_addr *)&forward->sentto->addr.in.sin_addr, "dnssec");
283 #ifdef HAVE_IPV6
284 else
285 log_query(F_DNSSEC | F_IPV6, "retry", (struct all_addr *)&forward->sentto->addr.in6.sin6_addr, "dnssec");
286 #endif
287
288 if (forward->sentto->sfd)
289 fd = forward->sentto->sfd->fd;
290 else
291 {
292 #ifdef HAVE_IPV6
293 if (forward->sentto->addr.sa.sa_family == AF_INET6)
294 fd = forward->rfd6->fd;
295 else
296 #endif
297 fd = forward->rfd4->fd;
298 }
299
300 while (sendto(fd, (char *)header, plen, 0,
301 &forward->sentto->addr.sa,
302 sa_len(&forward->sentto->addr)) == -1 && retry_send());
303
304 return 1;
305 }
306 #endif
307
308 /* retry on existing query, send to all available servers */
309 domain = forward->sentto->domain;
310 forward->sentto->failed_queries++;
311 if (!option_bool(OPT_ORDER))
312 {
313 forward->forwardall = 1;
314 daemon->last_server = NULL;
315 }
316 type = forward->sentto->flags & SERV_TYPE;
317 if (!(start = forward->sentto->next))
318 start = daemon->servers; /* at end of list, recycle */
319 header->id = htons(forward->new_id);
320 }
321 else
322 {
323 if (gotname)
324 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
325
326 if (!flags && !(forward = get_new_frec(now, NULL, 0)))
327 /* table full - server failure. */
328 flags = F_NEG;
329
330 if (forward)
331 {
332 forward->source = *udpaddr;
333 forward->dest = *dst_addr;
334 forward->iface = dst_iface;
335 forward->orig_id = ntohs(header->id);
336 forward->new_id = get_id();
337 forward->fd = udpfd;
338 memcpy(forward->hash, hash, HASH_SIZE);
339 forward->forwardall = 0;
340 forward->flags = 0;
341 if (norebind)
342 forward->flags |= FREC_NOREBIND;
343 if (header->hb4 & HB4_CD)
344 forward->flags |= FREC_CHECKING_DISABLED;
345 if (ad_reqd)
346 forward->flags |= FREC_AD_QUESTION;
347 #ifdef HAVE_DNSSEC
348 forward->work_counter = DNSSEC_WORK;
349 if (do_bit)
350 forward->flags |= FREC_DO_QUESTION;
351 #endif
352
353 header->id = htons(forward->new_id);
354
355 /* In strict_order mode, always try servers in the order
356 specified in resolv.conf, if a domain is given
357 always try all the available servers,
358 otherwise, use the one last known to work. */
359
360 if (type == 0)
361 {
362 if (option_bool(OPT_ORDER))
363 start = daemon->servers;
364 else if (!(start = daemon->last_server) ||
365 daemon->forwardcount++ > FORWARD_TEST ||
366 difftime(now, daemon->forwardtime) > FORWARD_TIME)
367 {
368 start = daemon->servers;
369 forward->forwardall = 1;
370 daemon->forwardcount = 0;
371 daemon->forwardtime = now;
372 }
373 }
374 else
375 {
376 start = daemon->servers;
377 if (!option_bool(OPT_ORDER))
378 forward->forwardall = 1;
379 }
380 }
381 }
382
383 /* check for send errors here (no route to host)
384 if we fail to send to all nameservers, send back an error
385 packet straight away (helps modem users when offline) */
386
387 if (!flags && forward)
388 {
389 struct server *firstsentto = start;
390 int forwarded = 0;
391
392 if (option_bool(OPT_ADD_MAC))
393 plen = add_mac(header, plen, ((char *) header) + daemon->packet_buff_sz, &forward->source);
394
395 if (option_bool(OPT_CLIENT_SUBNET))
396 {
397 size_t new = add_source_addr(header, plen, ((char *) header) + daemon->packet_buff_sz, &forward->source);
398 if (new != plen)
399 {
400 plen = new;
401 forward->flags |= FREC_HAS_SUBNET;
402 }
403 }
404
405 #ifdef HAVE_DNSSEC
406 if (option_bool(OPT_DNSSEC_VALID))
407 {
408 size_t new_plen = add_do_bit(header, plen, ((char *) header) + daemon->packet_buff_sz);
409
410 /* For debugging, set Checking Disabled, otherwise, have the upstream check too,
411 this allows it to select auth servers when one is returning bad data. */
412 if (option_bool(OPT_DNSSEC_DEBUG))
413 header->hb4 |= HB4_CD;
414
415 if (new_plen != plen)
416 forward->flags |= FREC_ADDED_PHEADER;
417
418 plen = new_plen;
419 }
420 #endif
421
422 while (1)
423 {
424 /* only send to servers dealing with our domain.
425 domain may be NULL, in which case server->domain
426 must be NULL also. */
427
428 if (type == (start->flags & SERV_TYPE) &&
429 (type != SERV_HAS_DOMAIN || hostname_isequal(domain, start->domain)) &&
430 !(start->flags & SERV_LITERAL_ADDRESS))
431 {
432 int fd;
433
434 /* find server socket to use, may need to get random one. */
435 if (start->sfd)
436 fd = start->sfd->fd;
437 else
438 {
439 #ifdef HAVE_IPV6
440 if (start->addr.sa.sa_family == AF_INET6)
441 {
442 if (!forward->rfd6 &&
443 !(forward->rfd6 = allocate_rfd(AF_INET6)))
444 break;
445 daemon->rfd_save = forward->rfd6;
446 fd = forward->rfd6->fd;
447 }
448 else
449 #endif
450 {
451 if (!forward->rfd4 &&
452 !(forward->rfd4 = allocate_rfd(AF_INET)))
453 break;
454 daemon->rfd_save = forward->rfd4;
455 fd = forward->rfd4->fd;
456 }
457
458 #ifdef HAVE_CONNTRACK
459 /* Copy connection mark of incoming query to outgoing connection. */
460 if (option_bool(OPT_CONNTRACK))
461 {
462 unsigned int mark;
463 if (get_incoming_mark(&forward->source, &forward->dest, 0, &mark))
464 setsockopt(fd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
465 }
466 #endif
467 }
468
469 if (sendto(fd, (char *)header, plen, 0,
470 &start->addr.sa,
471 sa_len(&start->addr)) == -1)
472 {
473 if (retry_send())
474 continue;
475 }
476 else
477 {
478 /* Keep info in case we want to re-send this packet */
479 daemon->srv_save = start;
480 daemon->packet_len = plen;
481
482 if (!gotname)
483 strcpy(daemon->namebuff, "query");
484 if (start->addr.sa.sa_family == AF_INET)
485 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
486 (struct all_addr *)&start->addr.in.sin_addr, NULL);
487 #ifdef HAVE_IPV6
488 else
489 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
490 (struct all_addr *)&start->addr.in6.sin6_addr, NULL);
491 #endif
492 start->queries++;
493 forwarded = 1;
494 forward->sentto = start;
495 if (!forward->forwardall)
496 break;
497 forward->forwardall++;
498 }
499 }
500
501 if (!(start = start->next))
502 start = daemon->servers;
503
504 if (start == firstsentto)
505 break;
506 }
507
508 if (forwarded)
509 return 1;
510
511 /* could not send on, prepare to return */
512 header->id = htons(forward->orig_id);
513 free_frec(forward); /* cancel */
514 }
515
516 /* could not send on, return empty answer or address if known for whole domain */
517 if (udpfd != -1)
518 {
519 plen = setup_reply(header, plen, addrp, flags, daemon->local_ttl);
520 send_from(udpfd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND), (char *)header, plen, udpaddr, dst_addr, dst_iface);
521 }
522
523 return 0;
524 }
525
526 static size_t process_reply(struct dns_header *header, time_t now, struct server *server, size_t n, int check_rebind,
527 int no_cache, int cache_secure, int ad_reqd, int do_bit, int added_pheader, int check_subnet, union mysockaddr *query_source)
528 {
529 unsigned char *pheader, *sizep;
530 char **sets = 0;
531 int munged = 0, is_sign;
532 size_t plen;
533
534 (void)ad_reqd;
535 (void) do_bit;
536
537 #ifdef HAVE_IPSET
538 /* Similar algorithm to search_servers. */
539 struct ipsets *ipset_pos;
540 unsigned int namelen = strlen(daemon->namebuff);
541 unsigned int matchlen = 0;
542 for (ipset_pos = daemon->ipsets; ipset_pos; ipset_pos = ipset_pos->next)
543 {
544 unsigned int domainlen = strlen(ipset_pos->domain);
545 char *matchstart = daemon->namebuff + namelen - domainlen;
546 if (namelen >= domainlen && hostname_isequal(matchstart, ipset_pos->domain) &&
547 (domainlen == 0 || namelen == domainlen || *(matchstart - 1) == '.' ) &&
548 domainlen >= matchlen)
549 {
550 matchlen = domainlen;
551 sets = ipset_pos->sets;
552 }
553 }
554 #endif
555
556 /* If upstream is advertising a larger UDP packet size
557 than we allow, trim it so that we don't get overlarge
558 requests for the client. We can't do this for signed packets. */
559
560 if ((pheader = find_pseudoheader(header, n, &plen, &sizep, &is_sign)))
561 {
562 unsigned short udpsz;
563 unsigned char *psave = sizep;
564
565 GETSHORT(udpsz, sizep);
566
567 if (!is_sign && udpsz > daemon->edns_pktsz)
568 PUTSHORT(daemon->edns_pktsz, psave);
569
570 if (check_subnet && !check_source(header, plen, pheader, query_source))
571 {
572 my_syslog(LOG_WARNING, _("discarding DNS reply: subnet option mismatch"));
573 return 0;
574 }
575
576 if (added_pheader)
577 {
578 pheader = 0;
579 header->arcount = htons(0);
580 }
581 }
582
583 /* RFC 4035 sect 4.6 para 3 */
584 if (!is_sign && !option_bool(OPT_DNSSEC_PROXY))
585 header->hb4 &= ~HB4_AD;
586
587 if (OPCODE(header) != QUERY || (RCODE(header) != NOERROR && RCODE(header) != NXDOMAIN))
588 return n;
589
590 /* Complain loudly if the upstream server is non-recursive. */
591 if (!(header->hb4 & HB4_RA) && RCODE(header) == NOERROR && ntohs(header->ancount) == 0 &&
592 server && !(server->flags & SERV_WARNED_RECURSIVE))
593 {
594 prettyprint_addr(&server->addr, daemon->namebuff);
595 my_syslog(LOG_WARNING, _("nameserver %s refused to do a recursive query"), daemon->namebuff);
596 if (!option_bool(OPT_LOG))
597 server->flags |= SERV_WARNED_RECURSIVE;
598 }
599
600 if (daemon->bogus_addr && RCODE(header) != NXDOMAIN &&
601 check_for_bogus_wildcard(header, n, daemon->namebuff, daemon->bogus_addr, now))
602 {
603 munged = 1;
604 SET_RCODE(header, NXDOMAIN);
605 header->hb3 &= ~HB3_AA;
606 cache_secure = 0;
607 }
608 else
609 {
610 int doctored = 0;
611
612 if (RCODE(header) == NXDOMAIN &&
613 extract_request(header, n, daemon->namebuff, NULL) &&
614 check_for_local_domain(daemon->namebuff, now))
615 {
616 /* if we forwarded a query for a locally known name (because it was for
617 an unknown type) and the answer is NXDOMAIN, convert that to NODATA,
618 since we know that the domain exists, even if upstream doesn't */
619 munged = 1;
620 header->hb3 |= HB3_AA;
621 SET_RCODE(header, NOERROR);
622 cache_secure = 0;
623 }
624
625 if (extract_addresses(header, n, daemon->namebuff, now, sets, is_sign, check_rebind, no_cache, cache_secure, &doctored))
626 {
627 my_syslog(LOG_WARNING, _("possible DNS-rebind attack detected: %s"), daemon->namebuff);
628 munged = 1;
629 cache_secure = 0;
630 }
631
632 if (doctored)
633 cache_secure = 0;
634 }
635
636 #ifdef HAVE_DNSSEC
637 if (no_cache && !(header->hb4 & HB4_CD))
638 {
639 if (!option_bool(OPT_DNSSEC_DEBUG))
640 {
641 /* Bogus reply, turn into SERVFAIL */
642 SET_RCODE(header, SERVFAIL);
643 munged = 1;
644 }
645 }
646
647 if (option_bool(OPT_DNSSEC_VALID))
648 header->hb4 &= ~HB4_AD;
649
650 if (!(header->hb4 & HB4_CD) && ad_reqd && cache_secure)
651 header->hb4 |= HB4_AD;
652
653 /* If the requestor didn't set the DO bit, don't return DNSSEC info. */
654 if (!do_bit)
655 n = filter_rrsigs(header, n);
656 #endif
657
658 /* do this after extract_addresses. Ensure NODATA reply and remove
659 nameserver info. */
660
661 if (munged)
662 {
663 header->ancount = htons(0);
664 header->nscount = htons(0);
665 header->arcount = htons(0);
666 }
667
668 /* the bogus-nxdomain stuff, doctor and NXDOMAIN->NODATA munging can all elide
669 sections of the packet. Find the new length here and put back pseudoheader
670 if it was removed. */
671 return resize_packet(header, n, pheader, plen);
672 }
673
674 /* sets new last_server */
675 void reply_query(int fd, int family, time_t now)
676 {
677 /* packet from peer server, extract data for cache, and send to
678 original requester */
679 struct dns_header *header;
680 union mysockaddr serveraddr;
681 struct frec *forward;
682 socklen_t addrlen = sizeof(serveraddr);
683 ssize_t n = recvfrom(fd, daemon->packet, daemon->packet_buff_sz, 0, &serveraddr.sa, &addrlen);
684 size_t nn;
685 struct server *server;
686 void *hash;
687 #ifndef HAVE_DNSSEC
688 unsigned int crc;
689 #endif
690
691 /* packet buffer overwritten */
692 daemon->srv_save = NULL;
693
694 /* Determine the address of the server replying so that we can mark that as good */
695 serveraddr.sa.sa_family = family;
696 #ifdef HAVE_IPV6
697 if (serveraddr.sa.sa_family == AF_INET6)
698 serveraddr.in6.sin6_flowinfo = 0;
699 #endif
700
701 header = (struct dns_header *)daemon->packet;
702
703 if (n < (int)sizeof(struct dns_header) || !(header->hb3 & HB3_QR))
704 return;
705
706 /* spoof check: answer must come from known server, */
707 for (server = daemon->servers; server; server = server->next)
708 if (!(server->flags & (SERV_LITERAL_ADDRESS | SERV_NO_ADDR)) &&
709 sockaddr_isequal(&server->addr, &serveraddr))
710 break;
711
712 if (!server)
713 return;
714
715 #ifdef HAVE_DNSSEC
716 hash = hash_questions(header, n, daemon->namebuff);
717 #else
718 hash = &crc;
719 crc = questions_crc(header, n, daemon->namebuff);
720 #endif
721
722 if (!(forward = lookup_frec(ntohs(header->id), hash)))
723 return;
724
725 if ((RCODE(header) == SERVFAIL || RCODE(header) == REFUSED) &&
726 !option_bool(OPT_ORDER) &&
727 forward->forwardall == 0)
728 /* for broken servers, attempt to send to another one. */
729 {
730 unsigned char *pheader;
731 size_t plen;
732 int is_sign;
733
734 /* recreate query from reply */
735 pheader = find_pseudoheader(header, (size_t)n, &plen, NULL, &is_sign);
736 if (!is_sign)
737 {
738 header->ancount = htons(0);
739 header->nscount = htons(0);
740 header->arcount = htons(0);
741 if ((nn = resize_packet(header, (size_t)n, pheader, plen)))
742 {
743 header->hb3 &= ~(HB3_QR | HB3_TC);
744 forward_query(-1, NULL, NULL, 0, header, nn, now, forward, 0, 0);
745 return;
746 }
747 }
748 }
749
750 server = forward->sentto;
751
752 if ((forward->sentto->flags & SERV_TYPE) == 0)
753 {
754 if (RCODE(header) == REFUSED)
755 server = NULL;
756 else
757 {
758 struct server *last_server;
759
760 /* find good server by address if possible, otherwise assume the last one we sent to */
761 for (last_server = daemon->servers; last_server; last_server = last_server->next)
762 if (!(last_server->flags & (SERV_LITERAL_ADDRESS | SERV_HAS_DOMAIN | SERV_FOR_NODOTS | SERV_NO_ADDR)) &&
763 sockaddr_isequal(&last_server->addr, &serveraddr))
764 {
765 server = last_server;
766 break;
767 }
768 }
769 if (!option_bool(OPT_ALL_SERVERS))
770 daemon->last_server = server;
771 }
772
773 /* If the answer is an error, keep the forward record in place in case
774 we get a good reply from another server. Kill it when we've
775 had replies from all to avoid filling the forwarding table when
776 everything is broken */
777 if (forward->forwardall == 0 || --forward->forwardall == 1 || RCODE(header) != SERVFAIL)
778 {
779 int check_rebind = 0, no_cache_dnssec = 0, cache_secure = 0;
780
781 if (option_bool(OPT_NO_REBIND))
782 check_rebind = !(forward->flags & FREC_NOREBIND);
783
784 /* Don't cache replies where DNSSEC validation was turned off, either
785 the upstream server told us so, or the original query specified it. */
786 if ((header->hb4 & HB4_CD) || (forward->flags & FREC_CHECKING_DISABLED))
787 no_cache_dnssec = 1;
788
789 #ifdef HAVE_DNSSEC
790 if (server && option_bool(OPT_DNSSEC_VALID) && !(forward->flags & FREC_CHECKING_DISABLED))
791 {
792 int status;
793
794 /* We've had a reply already, which we're validating. Ignore this duplicate */
795 if (forward->blocking_query)
796 return;
797
798 if (header->hb3 & HB3_TC)
799 {
800 /* Truncated answer can't be validated.
801 If this is an answer to a DNSSEC-generated query, we still
802 need to get the client to retry over TCP, so return
803 an answer with the TC bit set, even if the actual answer fits.
804 */
805 status = STAT_TRUNCATED;
806 }
807 else if (forward->flags & FREC_DNSKEY_QUERY)
808 status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
809 else if (forward->flags & FREC_DS_QUERY)
810 {
811 status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
812 if (status == STAT_NO_DS)
813 status = STAT_INSECURE;
814 }
815 else if (forward->flags & FREC_CHECK_NOSIGN)
816 status = do_check_sign(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
817 else
818 {
819 status = dnssec_validate_reply(now, header, n, daemon->namebuff, daemon->keyname, &forward->class, NULL);
820 if (status == STAT_NO_SIG)
821 {
822 if (option_bool(OPT_DNSSEC_NO_SIGN))
823 status = send_check_sign(now, header, n, daemon->namebuff, daemon->keyname);
824 else
825 status = STAT_INSECURE;
826 }
827 }
828 /* Can't validate, as we're missing key data. Put this
829 answer aside, whilst we get that. */
830 if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG || status == STAT_NEED_KEY)
831 {
832 struct frec *new, *orig;
833
834 /* Free any saved query */
835 if (forward->stash)
836 blockdata_free(forward->stash);
837
838 /* Now save reply pending receipt of key data */
839 if (!(forward->stash = blockdata_alloc((char *)header, n)))
840 return;
841 forward->stash_len = n;
842
843 anotherkey:
844 /* Find the original query that started it all.... */
845 for (orig = forward; orig->dependent; orig = orig->dependent);
846
847 if (--orig->work_counter == 0 || !(new = get_new_frec(now, NULL, 1)))
848 status = STAT_INSECURE;
849 else
850 {
851 int fd;
852 struct frec *next = new->next;
853 *new = *forward; /* copy everything, then overwrite */
854 new->next = next;
855 new->blocking_query = NULL;
856 new->rfd4 = NULL;
857 #ifdef HAVE_IPV6
858 new->rfd6 = NULL;
859 #endif
860 new->flags &= ~(FREC_DNSKEY_QUERY | FREC_DS_QUERY | FREC_CHECK_NOSIGN);
861
862 new->dependent = forward; /* to find query awaiting new one. */
863 forward->blocking_query = new; /* for garbage cleaning */
864 /* validate routines leave name of required record in daemon->keyname */
865 if (status == STAT_NEED_KEY)
866 {
867 new->flags |= FREC_DNSKEY_QUERY;
868 nn = dnssec_generate_query(header, ((char *) header) + daemon->packet_buff_sz,
869 daemon->keyname, forward->class, T_DNSKEY, &server->addr);
870 }
871 else
872 {
873 if (status == STAT_NEED_DS_NEG)
874 new->flags |= FREC_CHECK_NOSIGN;
875 else
876 new->flags |= FREC_DS_QUERY;
877 nn = dnssec_generate_query(header,((char *) header) + daemon->packet_buff_sz,
878 daemon->keyname, forward->class, T_DS, &server->addr);
879 }
880 if ((hash = hash_questions(header, nn, daemon->namebuff)))
881 memcpy(new->hash, hash, HASH_SIZE);
882 new->new_id = get_id();
883 header->id = htons(new->new_id);
884 /* Save query for retransmission */
885 new->stash = blockdata_alloc((char *)header, nn);
886 new->stash_len = nn;
887
888 /* Don't resend this. */
889 daemon->srv_save = NULL;
890
891 if (server->sfd)
892 fd = server->sfd->fd;
893 else
894 {
895 fd = -1;
896 #ifdef HAVE_IPV6
897 if (server->addr.sa.sa_family == AF_INET6)
898 {
899 if (new->rfd6 || (new->rfd6 = allocate_rfd(AF_INET6)))
900 fd = new->rfd6->fd;
901 }
902 else
903 #endif
904 {
905 if (new->rfd4 || (new->rfd4 = allocate_rfd(AF_INET)))
906 fd = new->rfd4->fd;
907 }
908 }
909
910 if (fd != -1)
911 {
912 while (sendto(fd, (char *)header, nn, 0, &server->addr.sa, sa_len(&server->addr)) == -1 && retry_send());
913 server->queries++;
914 }
915
916 return;
917 }
918 }
919
920 /* Ok, we reached far enough up the chain-of-trust that we can validate something.
921 Now wind back down, pulling back answers which wouldn't previously validate
922 and validate them with the new data. Note that if an answer needs multiple
923 keys to validate, we may find another key is needed, in which case we set off
924 down another branch of the tree. Once we get to the original answer
925 (FREC_DNSSEC_QUERY not set) and it validates, return it to the original requestor. */
926 while (forward->dependent)
927 {
928 struct frec *prev = forward->dependent;
929 free_frec(forward);
930 forward = prev;
931 forward->blocking_query = NULL; /* already gone */
932 blockdata_retrieve(forward->stash, forward->stash_len, (void *)header);
933 n = forward->stash_len;
934
935 if (status == STAT_SECURE)
936 {
937 if (forward->flags & FREC_DNSKEY_QUERY)
938 status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
939 else if (forward->flags & FREC_DS_QUERY)
940 {
941 status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
942 if (status == STAT_NO_DS)
943 status = STAT_INSECURE;
944 }
945 else if (forward->flags & FREC_CHECK_NOSIGN)
946 status = do_check_sign(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
947 else
948 {
949 status = dnssec_validate_reply(now, header, n, daemon->namebuff, daemon->keyname, &forward->class, NULL);
950 if (status == STAT_NO_SIG)
951 {
952 if (option_bool(OPT_DNSSEC_NO_SIGN))
953 status = send_check_sign(now, header, n, daemon->namebuff, daemon->keyname);
954 else
955 status = STAT_INSECURE;
956 }
957 }
958
959 if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG || status == STAT_NEED_KEY)
960 goto anotherkey;
961 }
962 }
963
964 if (status == STAT_TRUNCATED)
965 header->hb3 |= HB3_TC;
966 else
967 {
968 char *result;
969
970 if (forward->work_counter == 0)
971 result = "ABANDONED";
972 else
973 result = (status == STAT_SECURE ? "SECURE" : (status == STAT_INSECURE ? "INSECURE" : "BOGUS"));
974
975 log_query(F_KEYTAG | F_SECSTAT, "result", NULL, result);
976 }
977
978 no_cache_dnssec = 0;
979
980 if (status == STAT_SECURE)
981 cache_secure = 1;
982 else if (status == STAT_BOGUS)
983 no_cache_dnssec = 1;
984 }
985 #endif
986
987 /* restore CD bit to the value in the query */
988 if (forward->flags & FREC_CHECKING_DISABLED)
989 header->hb4 |= HB4_CD;
990 else
991 header->hb4 &= ~HB4_CD;
992
993 if ((nn = process_reply(header, now, server, (size_t)n, check_rebind, no_cache_dnssec, cache_secure,
994 forward->flags & FREC_AD_QUESTION, forward->flags & FREC_DO_QUESTION,
995 forward->flags & FREC_ADDED_PHEADER, forward->flags & FREC_HAS_SUBNET, &forward->source)))
996 {
997 header->id = htons(forward->orig_id);
998 header->hb4 |= HB4_RA; /* recursion if available */
999 send_from(forward->fd, option_bool(OPT_NOWILD) || option_bool (OPT_CLEVERBIND), daemon->packet, nn,
1000 &forward->source, &forward->dest, forward->iface);
1001 }
1002 free_frec(forward); /* cancel */
1003 }
1004 }
1005
1006
1007 void receive_query(struct listener *listen, time_t now)
1008 {
1009 struct dns_header *header = (struct dns_header *)daemon->packet;
1010 union mysockaddr source_addr;
1011 unsigned short type;
1012 struct all_addr dst_addr;
1013 struct in_addr netmask, dst_addr_4;
1014 size_t m;
1015 ssize_t n;
1016 int if_index = 0, auth_dns = 0;
1017 #ifdef HAVE_AUTH
1018 int local_auth = 0;
1019 #endif
1020 struct iovec iov[1];
1021 struct msghdr msg;
1022 struct cmsghdr *cmptr;
1023 union {
1024 struct cmsghdr align; /* this ensures alignment */
1025 #ifdef HAVE_IPV6
1026 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
1027 #endif
1028 #if defined(HAVE_LINUX_NETWORK)
1029 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
1030 #elif defined(IP_RECVDSTADDR) && defined(HAVE_SOLARIS_NETWORK)
1031 char control[CMSG_SPACE(sizeof(struct in_addr)) +
1032 CMSG_SPACE(sizeof(unsigned int))];
1033 #elif defined(IP_RECVDSTADDR)
1034 char control[CMSG_SPACE(sizeof(struct in_addr)) +
1035 CMSG_SPACE(sizeof(struct sockaddr_dl))];
1036 #endif
1037 } control_u;
1038 #ifdef HAVE_IPV6
1039 /* Can always get recvd interface for IPv6 */
1040 int check_dst = !option_bool(OPT_NOWILD) || listen->family == AF_INET6;
1041 #else
1042 int check_dst = !option_bool(OPT_NOWILD);
1043 #endif
1044
1045 /* packet buffer overwritten */
1046 daemon->srv_save = NULL;
1047
1048 dst_addr_4.s_addr = 0;
1049 netmask.s_addr = 0;
1050
1051 if (option_bool(OPT_NOWILD) && listen->iface)
1052 {
1053 auth_dns = listen->iface->dns_auth;
1054
1055 if (listen->family == AF_INET)
1056 {
1057 dst_addr_4 = listen->iface->addr.in.sin_addr;
1058 netmask = listen->iface->netmask;
1059 }
1060 }
1061
1062 iov[0].iov_base = daemon->packet;
1063 iov[0].iov_len = daemon->edns_pktsz;
1064
1065 msg.msg_control = control_u.control;
1066 msg.msg_controllen = sizeof(control_u);
1067 msg.msg_flags = 0;
1068 msg.msg_name = &source_addr;
1069 msg.msg_namelen = sizeof(source_addr);
1070 msg.msg_iov = iov;
1071 msg.msg_iovlen = 1;
1072
1073 if ((n = recvmsg(listen->fd, &msg, 0)) == -1)
1074 return;
1075
1076 if (n < (int)sizeof(struct dns_header) ||
1077 (msg.msg_flags & MSG_TRUNC) ||
1078 (header->hb3 & HB3_QR))
1079 return;
1080
1081 source_addr.sa.sa_family = listen->family;
1082
1083 if (listen->family == AF_INET)
1084 {
1085 /* Source-port == 0 is an error, we can't send back to that.
1086 http://www.ietf.org/mail-archive/web/dnsop/current/msg11441.html */
1087 if (source_addr.in.sin_port == 0)
1088 return;
1089 }
1090 #ifdef HAVE_IPV6
1091 else
1092 {
1093 /* Source-port == 0 is an error, we can't send back to that. */
1094 if (source_addr.in6.sin6_port == 0)
1095 return;
1096 source_addr.in6.sin6_flowinfo = 0;
1097 }
1098 #endif
1099
1100 /* We can be configured to only accept queries from at-most-one-hop-away addresses. */
1101 if (option_bool(OPT_LOCAL_SERVICE))
1102 {
1103 struct addrlist *addr;
1104 #ifdef HAVE_IPV6
1105 if (listen->family == AF_INET6)
1106 {
1107 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1108 if ((addr->flags & ADDRLIST_IPV6) &&
1109 is_same_net6(&addr->addr.addr.addr6, &source_addr.in6.sin6_addr, addr->prefixlen))
1110 break;
1111 }
1112 else
1113 #endif
1114 {
1115 struct in_addr netmask;
1116 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1117 {
1118 netmask.s_addr = 0xffffffff << (32 - addr->prefixlen);
1119 if (!(addr->flags & ADDRLIST_IPV6) &&
1120 is_same_net(addr->addr.addr.addr4, source_addr.in.sin_addr, netmask))
1121 break;
1122 }
1123 }
1124 if (!addr)
1125 {
1126 static int warned = 0;
1127 if (!warned)
1128 {
1129 my_syslog(LOG_WARNING, _("Ignoring query from non-local network"));
1130 warned = 1;
1131 }
1132 return;
1133 }
1134 }
1135
1136 if (check_dst)
1137 {
1138 struct ifreq ifr;
1139
1140 if (msg.msg_controllen < sizeof(struct cmsghdr))
1141 return;
1142
1143 #if defined(HAVE_LINUX_NETWORK)
1144 if (listen->family == AF_INET)
1145 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
1146 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_PKTINFO)
1147 {
1148 union {
1149 unsigned char *c;
1150 struct in_pktinfo *p;
1151 } p;
1152 p.c = CMSG_DATA(cmptr);
1153 dst_addr_4 = dst_addr.addr.addr4 = p.p->ipi_spec_dst;
1154 if_index = p.p->ipi_ifindex;
1155 }
1156 #elif defined(IP_RECVDSTADDR) && defined(IP_RECVIF)
1157 if (listen->family == AF_INET)
1158 {
1159 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
1160 {
1161 union {
1162 unsigned char *c;
1163 unsigned int *i;
1164 struct in_addr *a;
1165 #ifndef HAVE_SOLARIS_NETWORK
1166 struct sockaddr_dl *s;
1167 #endif
1168 } p;
1169 p.c = CMSG_DATA(cmptr);
1170 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVDSTADDR)
1171 dst_addr_4 = dst_addr.addr.addr4 = *(p.a);
1172 else if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVIF)
1173 #ifdef HAVE_SOLARIS_NETWORK
1174 if_index = *(p.i);
1175 #else
1176 if_index = p.s->sdl_index;
1177 #endif
1178 }
1179 }
1180 #endif
1181
1182 #ifdef HAVE_IPV6
1183 if (listen->family == AF_INET6)
1184 {
1185 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
1186 if (cmptr->cmsg_level == IPPROTO_IPV6 && cmptr->cmsg_type == daemon->v6pktinfo)
1187 {
1188 union {
1189 unsigned char *c;
1190 struct in6_pktinfo *p;
1191 } p;
1192 p.c = CMSG_DATA(cmptr);
1193
1194 dst_addr.addr.addr6 = p.p->ipi6_addr;
1195 if_index = p.p->ipi6_ifindex;
1196 }
1197 }
1198 #endif
1199
1200 /* enforce available interface configuration */
1201
1202 if (!indextoname(listen->fd, if_index, ifr.ifr_name))
1203 return;
1204
1205 if (!iface_check(listen->family, &dst_addr, ifr.ifr_name, &auth_dns))
1206 {
1207 if (!option_bool(OPT_CLEVERBIND))
1208 enumerate_interfaces(0);
1209 if (!loopback_exception(listen->fd, listen->family, &dst_addr, ifr.ifr_name) &&
1210 !label_exception(if_index, listen->family, &dst_addr))
1211 return;
1212 }
1213
1214 if (listen->family == AF_INET && option_bool(OPT_LOCALISE))
1215 {
1216 struct irec *iface;
1217
1218 /* get the netmask of the interface whch has the address we were sent to.
1219 This is no neccessarily the interface we arrived on. */
1220
1221 for (iface = daemon->interfaces; iface; iface = iface->next)
1222 if (iface->addr.sa.sa_family == AF_INET &&
1223 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
1224 break;
1225
1226 /* interface may be new */
1227 if (!iface && !option_bool(OPT_CLEVERBIND))
1228 enumerate_interfaces(0);
1229
1230 for (iface = daemon->interfaces; iface; iface = iface->next)
1231 if (iface->addr.sa.sa_family == AF_INET &&
1232 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
1233 break;
1234
1235 /* If we failed, abandon localisation */
1236 if (iface)
1237 netmask = iface->netmask;
1238 else
1239 dst_addr_4.s_addr = 0;
1240 }
1241 }
1242
1243 if (extract_request(header, (size_t)n, daemon->namebuff, &type))
1244 {
1245 #ifdef HAVE_AUTH
1246 struct auth_zone *zone;
1247 #endif
1248 char *types = querystr(auth_dns ? "auth" : "query", type);
1249
1250 if (listen->family == AF_INET)
1251 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1252 (struct all_addr *)&source_addr.in.sin_addr, types);
1253 #ifdef HAVE_IPV6
1254 else
1255 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1256 (struct all_addr *)&source_addr.in6.sin6_addr, types);
1257 #endif
1258
1259 #ifdef HAVE_AUTH
1260 /* find queries for zones we're authoritative for, and answer them directly */
1261 if (!auth_dns)
1262 for (zone = daemon->auth_zones; zone; zone = zone->next)
1263 if (in_zone(zone, daemon->namebuff, NULL))
1264 {
1265 auth_dns = 1;
1266 local_auth = 1;
1267 break;
1268 }
1269 #endif
1270 }
1271
1272 #ifdef HAVE_AUTH
1273 if (auth_dns)
1274 {
1275 m = answer_auth(header, ((char *) header) + daemon->packet_buff_sz, (size_t)n, now, &source_addr, local_auth);
1276 if (m >= 1)
1277 {
1278 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
1279 (char *)header, m, &source_addr, &dst_addr, if_index);
1280 daemon->auth_answer++;
1281 }
1282 }
1283 else
1284 #endif
1285 {
1286 int ad_reqd, do_bit;
1287 m = answer_request(header, ((char *) header) + daemon->packet_buff_sz, (size_t)n,
1288 dst_addr_4, netmask, now, &ad_reqd, &do_bit);
1289
1290 if (m >= 1)
1291 {
1292 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
1293 (char *)header, m, &source_addr, &dst_addr, if_index);
1294 daemon->local_answer++;
1295 }
1296 else if (forward_query(listen->fd, &source_addr, &dst_addr, if_index,
1297 header, (size_t)n, now, NULL, ad_reqd, do_bit))
1298 daemon->queries_forwarded++;
1299 else
1300 daemon->local_answer++;
1301 }
1302 }
1303
1304 #ifdef HAVE_DNSSEC
1305
1306 /* UDP: we've got an unsigned answer, return STAT_INSECURE if we can prove there's no DS
1307 and therefore the answer shouldn't be signed, or STAT_BOGUS if it should be, or
1308 STAT_NEED_DS_NEG and keyname if we need to do the query. */
1309 static int send_check_sign(time_t now, struct dns_header *header, size_t plen, char *name, char *keyname)
1310 {
1311 struct crec *crecp;
1312 char *name_start = name;
1313 int status = dnssec_chase_cname(now, header, plen, name, keyname);
1314
1315 if (status != STAT_INSECURE)
1316 return status;
1317
1318 while (1)
1319 {
1320 crecp = cache_find_by_name(NULL, name_start, now, F_DS);
1321
1322 if (crecp && (crecp->flags & F_DNSSECOK))
1323 return (crecp->flags & F_NEG) ? STAT_INSECURE : STAT_BOGUS;
1324
1325 if (crecp && (crecp->flags & F_NEG) && (name_start = strchr(name_start, '.')))
1326 {
1327 name_start++; /* chop a label off and try again */
1328 continue;
1329 }
1330
1331 /* Reached the root */
1332 if (!name_start)
1333 return STAT_BOGUS;
1334
1335 strcpy(keyname, name_start);
1336 return STAT_NEED_DS_NEG;
1337 }
1338 }
1339
1340 /* Got answer to DS query from send_check_sign, check for proven non-existence, or make the next DS query to try. */
1341 static int do_check_sign(time_t now, struct dns_header *header, size_t plen, char *name, char *keyname, int class)
1342
1343 {
1344 char *name_start;
1345 unsigned char *p;
1346 int status = dnssec_validate_ds(now, header, plen, name, keyname, class);
1347
1348 if (status != STAT_INSECURE)
1349 {
1350 if (status == STAT_NO_DS)
1351 status = STAT_INSECURE;
1352 return status;
1353 }
1354
1355 p = (unsigned char *)(header+1);
1356
1357 if (extract_name(header, plen, &p, name, 1, 4) &&
1358 (name_start = strchr(name, '.')))
1359 {
1360 name_start++; /* chop a label off and try again */
1361 strcpy(keyname, name_start);
1362 return STAT_NEED_DS_NEG;
1363 }
1364
1365 return STAT_BOGUS;
1366 }
1367
1368 /* Move toward the root, until we find a signed non-existance of a DS, in which case
1369 an unsigned answer is OK, or we find a signed DS, in which case there should be
1370 a signature, and the answer is BOGUS */
1371 static int tcp_check_for_unsigned_zone(time_t now, struct dns_header *header, size_t plen, int class, char *name,
1372 char *keyname, struct server *server, int *keycount)
1373 {
1374 size_t m;
1375 unsigned char *packet, *payload;
1376 u16 *length;
1377 unsigned char *p = (unsigned char *)(header+1);
1378 int status;
1379 char *name_start = name;
1380
1381 /* Get first insecure entry in CNAME chain */
1382 status = tcp_key_recurse(now, STAT_CHASE_CNAME, header, plen, class, name, keyname, server, keycount);
1383 if (status == STAT_BOGUS)
1384 return STAT_BOGUS;
1385
1386 if (!(packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16))))
1387 return STAT_BOGUS;
1388
1389 payload = &packet[2];
1390 header = (struct dns_header *)payload;
1391 length = (u16 *)packet;
1392
1393 while (1)
1394 {
1395 unsigned char *newhash, hash[HASH_SIZE];
1396 unsigned char c1, c2;
1397 struct crec *crecp = cache_find_by_name(NULL, name_start, now, F_DS);
1398
1399 if (--(*keycount) == 0)
1400 {
1401 free(packet);
1402 return STAT_BOGUS;
1403 }
1404
1405 if (crecp && (crecp->flags & F_DNSSECOK))
1406 {
1407 free(packet);
1408 return (crecp->flags & F_NEG) ? STAT_INSECURE : STAT_BOGUS;
1409 }
1410
1411 /* If we have cached insecurely that a DS doesn't exist,
1412 ise that is a hit for where to start looking for the secure one */
1413 if (crecp && (crecp->flags & F_NEG) && (name_start = strchr(name_start, '.')))
1414 {
1415 name_start++; /* chop a label off and try again */
1416 continue;
1417 }
1418
1419 /* reached the root */
1420 if (!name_start)
1421 {
1422 free(packet);
1423 return STAT_BOGUS;
1424 }
1425
1426 m = dnssec_generate_query(header, ((char *) header) + 65536, name_start, class, T_DS, &server->addr);
1427
1428 /* We rely on the question section coming back unchanged, ensure it is with the hash. */
1429 if ((newhash = hash_questions(header, (unsigned int)m, name)))
1430 {
1431 memcpy(hash, newhash, HASH_SIZE);
1432
1433 *length = htons(m);
1434
1435 if (read_write(server->tcpfd, packet, m + sizeof(u16), 0) &&
1436 read_write(server->tcpfd, &c1, 1, 1) &&
1437 read_write(server->tcpfd, &c2, 1, 1) &&
1438 read_write(server->tcpfd, payload, (c1 << 8) | c2, 1))
1439 {
1440 m = (c1 << 8) | c2;
1441
1442 newhash = hash_questions(header, (unsigned int)m, name);
1443 if (newhash && memcmp(hash, newhash, HASH_SIZE) == 0)
1444 {
1445 /* Note this trashes all three name workspaces */
1446 status = tcp_key_recurse(now, STAT_NEED_DS_NEG, header, m, class, name, keyname, server, keycount);
1447
1448 /* We've found a DS which proves the bit of the DNS where the
1449 original query is, is unsigned, so the answer is OK,
1450 if unvalidated. */
1451 if (status == STAT_NO_DS)
1452 {
1453 free(packet);
1454 return STAT_INSECURE;
1455 }
1456
1457 /* No DS, not got to DNSSEC-land yet, go up. */
1458 if (status == STAT_INSECURE)
1459 {
1460 p = (unsigned char *)(header+1);
1461
1462 if (extract_name(header, plen, &p, name, 1, 4) &&
1463 (name_start = strchr(name, '.')))
1464 {
1465 name_start++; /* chop a label off and try again */
1466 continue;
1467 }
1468 }
1469 }
1470 }
1471 }
1472
1473 free(packet);
1474
1475 return STAT_BOGUS;
1476 }
1477 }
1478
1479 static int tcp_key_recurse(time_t now, int status, struct dns_header *header, size_t n,
1480 int class, char *name, char *keyname, struct server *server, int *keycount)
1481 {
1482 /* Recurse up the key heirarchy */
1483 int new_status;
1484
1485 /* limit the amount of work we do, to avoid cycling forever on loops in the DNS */
1486 if (--(*keycount) == 0)
1487 return STAT_INSECURE;
1488
1489 if (status == STAT_NEED_KEY)
1490 new_status = dnssec_validate_by_ds(now, header, n, name, keyname, class);
1491 else if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG)
1492 {
1493 new_status = dnssec_validate_ds(now, header, n, name, keyname, class);
1494 if (status == STAT_NEED_DS && new_status == STAT_NO_DS)
1495 new_status = STAT_INSECURE;
1496 }
1497 else if (status == STAT_CHASE_CNAME)
1498 new_status = dnssec_chase_cname(now, header, n, name, keyname);
1499 else
1500 {
1501 new_status = dnssec_validate_reply(now, header, n, name, keyname, &class, NULL);
1502
1503 if (new_status == STAT_NO_SIG)
1504 {
1505 if (option_bool(OPT_DNSSEC_NO_SIGN))
1506 new_status = tcp_check_for_unsigned_zone(now, header, n, class, name, keyname, server, keycount);
1507 else
1508 new_status = STAT_INSECURE;
1509 }
1510 }
1511
1512 /* Can't validate because we need a key/DS whose name now in keyname.
1513 Make query for same, and recurse to validate */
1514 if (new_status == STAT_NEED_DS || new_status == STAT_NEED_KEY)
1515 {
1516 size_t m;
1517 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
1518 unsigned char *payload = &packet[2];
1519 struct dns_header *new_header = (struct dns_header *)payload;
1520 u16 *length = (u16 *)packet;
1521 unsigned char c1, c2;
1522
1523 if (!packet)
1524 return STAT_INSECURE;
1525
1526 another_tcp_key:
1527 m = dnssec_generate_query(new_header, ((char *) new_header) + 65536, keyname, class,
1528 new_status == STAT_NEED_KEY ? T_DNSKEY : T_DS, &server->addr);
1529
1530 *length = htons(m);
1531
1532 if (!read_write(server->tcpfd, packet, m + sizeof(u16), 0) ||
1533 !read_write(server->tcpfd, &c1, 1, 1) ||
1534 !read_write(server->tcpfd, &c2, 1, 1) ||
1535 !read_write(server->tcpfd, payload, (c1 << 8) | c2, 1))
1536 new_status = STAT_INSECURE;
1537 else
1538 {
1539 m = (c1 << 8) | c2;
1540
1541 new_status = tcp_key_recurse(now, new_status, new_header, m, class, name, keyname, server, keycount);
1542
1543 if (new_status == STAT_SECURE)
1544 {
1545 /* Reached a validated record, now try again at this level.
1546 Note that we may get ANOTHER NEED_* if an answer needs more than one key.
1547 If so, go round again. */
1548
1549 if (status == STAT_NEED_KEY)
1550 new_status = dnssec_validate_by_ds(now, header, n, name, keyname, class);
1551 else if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG)
1552 {
1553 new_status = dnssec_validate_ds(now, header, n, name, keyname, class);
1554 if (status == STAT_NEED_DS && new_status == STAT_NO_DS)
1555 new_status = STAT_INSECURE; /* Validated no DS */
1556 }
1557 else if (status == STAT_CHASE_CNAME)
1558 new_status = dnssec_chase_cname(now, header, n, name, keyname);
1559 else
1560 {
1561 new_status = dnssec_validate_reply(now, header, n, name, keyname, &class, NULL);
1562
1563 if (new_status == STAT_NO_SIG)
1564 {
1565 if (option_bool(OPT_DNSSEC_NO_SIGN))
1566 new_status = tcp_check_for_unsigned_zone(now, header, n, class, name, keyname, server, keycount);
1567 else
1568 new_status = STAT_INSECURE;
1569 }
1570 }
1571
1572 if (new_status == STAT_NEED_DS || new_status == STAT_NEED_KEY)
1573 goto another_tcp_key;
1574 }
1575 }
1576
1577 free(packet);
1578 }
1579 return new_status;
1580 }
1581 #endif
1582
1583
1584 /* The daemon forks before calling this: it should deal with one connection,
1585 blocking as neccessary, and then return. Note, need to be a bit careful
1586 about resources for debug mode, when the fork is suppressed: that's
1587 done by the caller. */
1588 unsigned char *tcp_request(int confd, time_t now,
1589 union mysockaddr *local_addr, struct in_addr netmask, int auth_dns)
1590 {
1591 size_t size = 0;
1592 int norebind = 0;
1593 #ifdef HAVE_AUTH
1594 int local_auth = 0;
1595 #endif
1596 int checking_disabled, ad_question, do_bit, added_pheader = 0;
1597 int check_subnet, no_cache_dnssec = 0, cache_secure = 0;
1598 size_t m;
1599 unsigned short qtype;
1600 unsigned int gotname;
1601 unsigned char c1, c2;
1602 /* Max TCP packet + slop + size */
1603 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
1604 unsigned char *payload = &packet[2];
1605 /* largest field in header is 16-bits, so this is still sufficiently aligned */
1606 struct dns_header *header = (struct dns_header *)payload;
1607 u16 *length = (u16 *)packet;
1608 struct server *last_server;
1609 struct in_addr dst_addr_4;
1610 union mysockaddr peer_addr;
1611 socklen_t peer_len = sizeof(union mysockaddr);
1612
1613 if (getpeername(confd, (struct sockaddr *)&peer_addr, &peer_len) == -1)
1614 return packet;
1615
1616 /* We can be configured to only accept queries from at-most-one-hop-away addresses. */
1617 if (option_bool(OPT_LOCAL_SERVICE))
1618 {
1619 struct addrlist *addr;
1620 #ifdef HAVE_IPV6
1621 if (peer_addr.sa.sa_family == AF_INET6)
1622 {
1623 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1624 if ((addr->flags & ADDRLIST_IPV6) &&
1625 is_same_net6(&addr->addr.addr.addr6, &peer_addr.in6.sin6_addr, addr->prefixlen))
1626 break;
1627 }
1628 else
1629 #endif
1630 {
1631 struct in_addr netmask;
1632 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1633 {
1634 netmask.s_addr = 0xffffffff << (32 - addr->prefixlen);
1635 if (!(addr->flags & ADDRLIST_IPV6) &&
1636 is_same_net(addr->addr.addr.addr4, peer_addr.in.sin_addr, netmask))
1637 break;
1638 }
1639 }
1640 if (!addr)
1641 {
1642 my_syslog(LOG_WARNING, _("Ignoring query from non-local network"));
1643 return packet;
1644 }
1645 }
1646
1647 while (1)
1648 {
1649 if (!packet ||
1650 !read_write(confd, &c1, 1, 1) || !read_write(confd, &c2, 1, 1) ||
1651 !(size = c1 << 8 | c2) ||
1652 !read_write(confd, payload, size, 1))
1653 return packet;
1654
1655 if (size < (int)sizeof(struct dns_header))
1656 continue;
1657
1658 check_subnet = 0;
1659
1660 /* save state of "cd" flag in query */
1661 if ((checking_disabled = header->hb4 & HB4_CD))
1662 no_cache_dnssec = 1;
1663
1664 if ((gotname = extract_request(header, (unsigned int)size, daemon->namebuff, &qtype)))
1665 {
1666 #ifdef HAVE_AUTH
1667 struct auth_zone *zone;
1668 #endif
1669 char *types = querystr(auth_dns ? "auth" : "query", qtype);
1670
1671 if (peer_addr.sa.sa_family == AF_INET)
1672 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1673 (struct all_addr *)&peer_addr.in.sin_addr, types);
1674 #ifdef HAVE_IPV6
1675 else
1676 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1677 (struct all_addr *)&peer_addr.in6.sin6_addr, types);
1678 #endif
1679
1680 #ifdef HAVE_AUTH
1681 /* find queries for zones we're authoritative for, and answer them directly */
1682 if (!auth_dns)
1683 for (zone = daemon->auth_zones; zone; zone = zone->next)
1684 if (in_zone(zone, daemon->namebuff, NULL))
1685 {
1686 auth_dns = 1;
1687 local_auth = 1;
1688 break;
1689 }
1690 #endif
1691 }
1692
1693 if (local_addr->sa.sa_family == AF_INET)
1694 dst_addr_4 = local_addr->in.sin_addr;
1695 else
1696 dst_addr_4.s_addr = 0;
1697
1698 #ifdef HAVE_AUTH
1699 if (auth_dns)
1700 m = answer_auth(header, ((char *) header) + 65536, (size_t)size, now, &peer_addr, local_auth);
1701 else
1702 #endif
1703 {
1704 /* m > 0 if answered from cache */
1705 m = answer_request(header, ((char *) header) + 65536, (size_t)size,
1706 dst_addr_4, netmask, now, &ad_question, &do_bit);
1707
1708 /* Do this by steam now we're not in the select() loop */
1709 check_log_writer(NULL);
1710
1711 if (m == 0)
1712 {
1713 unsigned int flags = 0;
1714 struct all_addr *addrp = NULL;
1715 int type = 0;
1716 char *domain = NULL;
1717
1718 if (option_bool(OPT_ADD_MAC))
1719 size = add_mac(header, size, ((char *) header) + 65536, &peer_addr);
1720
1721 if (option_bool(OPT_CLIENT_SUBNET))
1722 {
1723 size_t new = add_source_addr(header, size, ((char *) header) + 65536, &peer_addr);
1724 if (size != new)
1725 {
1726 size = new;
1727 check_subnet = 1;
1728 }
1729 }
1730
1731 if (gotname)
1732 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
1733
1734 if (type != 0 || option_bool(OPT_ORDER) || !daemon->last_server)
1735 last_server = daemon->servers;
1736 else
1737 last_server = daemon->last_server;
1738
1739 if (!flags && last_server)
1740 {
1741 struct server *firstsendto = NULL;
1742 #ifdef HAVE_DNSSEC
1743 unsigned char *newhash, hash[HASH_SIZE];
1744 if ((newhash = hash_questions(header, (unsigned int)size, daemon->keyname)))
1745 memcpy(hash, newhash, HASH_SIZE);
1746 else
1747 memset(hash, 0, HASH_SIZE);
1748 #else
1749 unsigned int crc = questions_crc(header, (unsigned int)size, daemon->namebuff);
1750 #endif
1751 /* Loop round available servers until we succeed in connecting to one.
1752 Note that this code subtley ensures that consecutive queries on this connection
1753 which can go to the same server, do so. */
1754 while (1)
1755 {
1756 if (!firstsendto)
1757 firstsendto = last_server;
1758 else
1759 {
1760 if (!(last_server = last_server->next))
1761 last_server = daemon->servers;
1762
1763 if (last_server == firstsendto)
1764 break;
1765 }
1766
1767 /* server for wrong domain */
1768 if (type != (last_server->flags & SERV_TYPE) ||
1769 (type == SERV_HAS_DOMAIN && !hostname_isequal(domain, last_server->domain)))
1770 continue;
1771
1772 if (last_server->tcpfd == -1)
1773 {
1774 if ((last_server->tcpfd = socket(last_server->addr.sa.sa_family, SOCK_STREAM, 0)) == -1)
1775 continue;
1776
1777 if ((!local_bind(last_server->tcpfd, &last_server->source_addr, last_server->interface, 1) ||
1778 connect(last_server->tcpfd, &last_server->addr.sa, sa_len(&last_server->addr)) == -1))
1779 {
1780 close(last_server->tcpfd);
1781 last_server->tcpfd = -1;
1782 continue;
1783 }
1784
1785 #ifdef HAVE_DNSSEC
1786 if (option_bool(OPT_DNSSEC_VALID))
1787 {
1788 size_t new_size = add_do_bit(header, size, ((char *) header) + 65536);
1789
1790 /* For debugging, set Checking Disabled, otherwise, have the upstream check too,
1791 this allows it to select auth servers when one is returning bad data. */
1792 if (option_bool(OPT_DNSSEC_DEBUG))
1793 header->hb4 |= HB4_CD;
1794
1795 if (size != new_size)
1796 added_pheader = 1;
1797
1798 size = new_size;
1799 }
1800 #endif
1801
1802 #ifdef HAVE_CONNTRACK
1803 /* Copy connection mark of incoming query to outgoing connection. */
1804 if (option_bool(OPT_CONNTRACK))
1805 {
1806 unsigned int mark;
1807 struct all_addr local;
1808 #ifdef HAVE_IPV6
1809 if (local_addr->sa.sa_family == AF_INET6)
1810 local.addr.addr6 = local_addr->in6.sin6_addr;
1811 else
1812 #endif
1813 local.addr.addr4 = local_addr->in.sin_addr;
1814
1815 if (get_incoming_mark(&peer_addr, &local, 1, &mark))
1816 setsockopt(last_server->tcpfd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
1817 }
1818 #endif
1819 }
1820
1821 *length = htons(size);
1822
1823 if (!read_write(last_server->tcpfd, packet, size + sizeof(u16), 0) ||
1824 !read_write(last_server->tcpfd, &c1, 1, 1) ||
1825 !read_write(last_server->tcpfd, &c2, 1, 1) ||
1826 !read_write(last_server->tcpfd, payload, (c1 << 8) | c2, 1))
1827 {
1828 close(last_server->tcpfd);
1829 last_server->tcpfd = -1;
1830 continue;
1831 }
1832
1833 m = (c1 << 8) | c2;
1834
1835 if (!gotname)
1836 strcpy(daemon->namebuff, "query");
1837 if (last_server->addr.sa.sa_family == AF_INET)
1838 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1839 (struct all_addr *)&last_server->addr.in.sin_addr, NULL);
1840 #ifdef HAVE_IPV6
1841 else
1842 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1843 (struct all_addr *)&last_server->addr.in6.sin6_addr, NULL);
1844 #endif
1845
1846 #ifdef HAVE_DNSSEC
1847 if (option_bool(OPT_DNSSEC_VALID) && !checking_disabled)
1848 {
1849 int keycount = DNSSEC_WORK; /* Limit to number of DNSSEC questions, to catch loops and avoid filling cache. */
1850 int status = tcp_key_recurse(now, STAT_TRUNCATED, header, m, 0, daemon->namebuff, daemon->keyname, last_server, &keycount);
1851 char *result;
1852
1853 if (keycount == 0)
1854 result = "ABANDONED";
1855 else
1856 result = (status == STAT_SECURE ? "SECURE" : (status == STAT_INSECURE ? "INSECURE" : "BOGUS"));
1857
1858 log_query(F_KEYTAG | F_SECSTAT, "result", NULL, result);
1859
1860 if (status == STAT_BOGUS)
1861 no_cache_dnssec = 1;
1862
1863 if (status == STAT_SECURE)
1864 cache_secure = 1;
1865 }
1866 #endif
1867
1868 /* restore CD bit to the value in the query */
1869 if (checking_disabled)
1870 header->hb4 |= HB4_CD;
1871 else
1872 header->hb4 &= ~HB4_CD;
1873
1874 /* There's no point in updating the cache, since this process will exit and
1875 lose the information after a few queries. We make this call for the alias and
1876 bogus-nxdomain side-effects. */
1877 /* If the crc of the question section doesn't match the crc we sent, then
1878 someone might be attempting to insert bogus values into the cache by
1879 sending replies containing questions and bogus answers. */
1880 #ifdef HAVE_DNSSEC
1881 newhash = hash_questions(header, (unsigned int)m, daemon->namebuff);
1882 if (!newhash || memcmp(hash, newhash, HASH_SIZE) != 0)
1883 {
1884 m = 0;
1885 break;
1886 }
1887 #else
1888 if (crc != questions_crc(header, (unsigned int)m, daemon->namebuff))
1889 {
1890 m = 0;
1891 break;
1892 }
1893 #endif
1894
1895 m = process_reply(header, now, last_server, (unsigned int)m,
1896 option_bool(OPT_NO_REBIND) && !norebind, no_cache_dnssec,
1897 cache_secure, ad_question, do_bit, added_pheader, check_subnet, &peer_addr);
1898
1899 break;
1900 }
1901 }
1902
1903 /* In case of local answer or no connections made. */
1904 if (m == 0)
1905 m = setup_reply(header, (unsigned int)size, addrp, flags, daemon->local_ttl);
1906 }
1907 }
1908
1909 check_log_writer(NULL);
1910
1911 *length = htons(m);
1912
1913 if (m == 0 || !read_write(confd, packet, m + sizeof(u16), 0))
1914 return packet;
1915 }
1916 }
1917
1918 static struct frec *allocate_frec(time_t now)
1919 {
1920 struct frec *f;
1921
1922 if ((f = (struct frec *)whine_malloc(sizeof(struct frec))))
1923 {
1924 f->next = daemon->frec_list;
1925 f->time = now;
1926 f->sentto = NULL;
1927 f->rfd4 = NULL;
1928 f->flags = 0;
1929 #ifdef HAVE_IPV6
1930 f->rfd6 = NULL;
1931 #endif
1932 #ifdef HAVE_DNSSEC
1933 f->dependent = NULL;
1934 f->blocking_query = NULL;
1935 f->stash = NULL;
1936 #endif
1937 daemon->frec_list = f;
1938 }
1939
1940 return f;
1941 }
1942
1943 static struct randfd *allocate_rfd(int family)
1944 {
1945 static int finger = 0;
1946 int i;
1947
1948 /* limit the number of sockets we have open to avoid starvation of
1949 (eg) TFTP. Once we have a reasonable number, randomness should be OK */
1950
1951 for (i = 0; i < RANDOM_SOCKS; i++)
1952 if (daemon->randomsocks[i].refcount == 0)
1953 {
1954 if ((daemon->randomsocks[i].fd = random_sock(family)) == -1)
1955 break;
1956
1957 daemon->randomsocks[i].refcount = 1;
1958 daemon->randomsocks[i].family = family;
1959 return &daemon->randomsocks[i];
1960 }
1961
1962 /* No free ones or cannot get new socket, grab an existing one */
1963 for (i = 0; i < RANDOM_SOCKS; i++)
1964 {
1965 int j = (i+finger) % RANDOM_SOCKS;
1966 if (daemon->randomsocks[j].refcount != 0 &&
1967 daemon->randomsocks[j].family == family &&
1968 daemon->randomsocks[j].refcount != 0xffff)
1969 {
1970 finger = j;
1971 daemon->randomsocks[j].refcount++;
1972 return &daemon->randomsocks[j];
1973 }
1974 }
1975
1976 return NULL; /* doom */
1977 }
1978 static void free_frec(struct frec *f)
1979 {
1980 if (f->rfd4 && --(f->rfd4->refcount) == 0)
1981 close(f->rfd4->fd);
1982
1983 f->rfd4 = NULL;
1984 f->sentto = NULL;
1985 f->flags = 0;
1986
1987 #ifdef HAVE_IPV6
1988 if (f->rfd6 && --(f->rfd6->refcount) == 0)
1989 close(f->rfd6->fd);
1990
1991 f->rfd6 = NULL;
1992 #endif
1993
1994 #ifdef HAVE_DNSSEC
1995 if (f->stash)
1996 {
1997 blockdata_free(f->stash);
1998 f->stash = NULL;
1999 }
2000
2001 /* Anything we're waiting on is pointless now, too */
2002 if (f->blocking_query)
2003 free_frec(f->blocking_query);
2004 f->blocking_query = NULL;
2005 f->dependent = NULL;
2006 #endif
2007 }
2008
2009 /* if wait==NULL return a free or older than TIMEOUT record.
2010 else return *wait zero if one available, or *wait is delay to
2011 when the oldest in-use record will expire. Impose an absolute
2012 limit of 4*TIMEOUT before we wipe things (for random sockets).
2013 If force is set, always return a result, even if we have
2014 to allocate above the limit. */
2015 struct frec *get_new_frec(time_t now, int *wait, int force)
2016 {
2017 struct frec *f, *oldest, *target;
2018 int count;
2019
2020 if (wait)
2021 *wait = 0;
2022
2023 for (f = daemon->frec_list, oldest = NULL, target = NULL, count = 0; f; f = f->next, count++)
2024 if (!f->sentto)
2025 target = f;
2026 else
2027 {
2028 if (difftime(now, f->time) >= 4*TIMEOUT)
2029 {
2030 free_frec(f);
2031 target = f;
2032 }
2033
2034 if (!oldest || difftime(f->time, oldest->time) <= 0)
2035 oldest = f;
2036 }
2037
2038 if (target)
2039 {
2040 target->time = now;
2041 return target;
2042 }
2043
2044 /* can't find empty one, use oldest if there is one
2045 and it's older than timeout */
2046 if (oldest && ((int)difftime(now, oldest->time)) >= TIMEOUT)
2047 {
2048 /* keep stuff for twice timeout if we can by allocating a new
2049 record instead */
2050 if (difftime(now, oldest->time) < 2*TIMEOUT &&
2051 count <= daemon->ftabsize &&
2052 (f = allocate_frec(now)))
2053 return f;
2054
2055 if (!wait)
2056 {
2057 free_frec(oldest);
2058 oldest->time = now;
2059 }
2060 return oldest;
2061 }
2062
2063 /* none available, calculate time 'till oldest record expires */
2064 if (!force && count > daemon->ftabsize)
2065 {
2066 static time_t last_log = 0;
2067
2068 if (oldest && wait)
2069 *wait = oldest->time + (time_t)TIMEOUT - now;
2070
2071 if ((int)difftime(now, last_log) > 5)
2072 {
2073 last_log = now;
2074 my_syslog(LOG_WARNING, _("Maximum number of concurrent DNS queries reached (max: %d)"), daemon->ftabsize);
2075 }
2076
2077 return NULL;
2078 }
2079
2080 if (!(f = allocate_frec(now)) && wait)
2081 /* wait one second on malloc failure */
2082 *wait = 1;
2083
2084 return f; /* OK if malloc fails and this is NULL */
2085 }
2086
2087 /* crc is all-ones if not known. */
2088 static struct frec *lookup_frec(unsigned short id, void *hash)
2089 {
2090 struct frec *f;
2091
2092 for(f = daemon->frec_list; f; f = f->next)
2093 if (f->sentto && f->new_id == id &&
2094 (!hash || memcmp(hash, f->hash, HASH_SIZE) == 0))
2095 return f;
2096
2097 return NULL;
2098 }
2099
2100 static struct frec *lookup_frec_by_sender(unsigned short id,
2101 union mysockaddr *addr,
2102 void *hash)
2103 {
2104 struct frec *f;
2105
2106 for(f = daemon->frec_list; f; f = f->next)
2107 if (f->sentto &&
2108 f->orig_id == id &&
2109 memcmp(hash, f->hash, HASH_SIZE) == 0 &&
2110 sockaddr_isequal(&f->source, addr))
2111 return f;
2112
2113 return NULL;
2114 }
2115
2116 /* A server record is going away, remove references to it */
2117 void server_gone(struct server *server)
2118 {
2119 struct frec *f;
2120
2121 for (f = daemon->frec_list; f; f = f->next)
2122 if (f->sentto && f->sentto == server)
2123 free_frec(f);
2124
2125 if (daemon->last_server == server)
2126 daemon->last_server = NULL;
2127
2128 if (daemon->srv_save == server)
2129 daemon->srv_save = NULL;
2130 }
2131
2132 /* return unique random ids. */
2133 static unsigned short get_id(void)
2134 {
2135 unsigned short ret = 0;
2136
2137 do
2138 ret = rand16();
2139 while (lookup_frec(ret, NULL));
2140
2141 return ret;
2142 }
2143
2144
2145
2146
2147