]>
git.ipfire.org Git - people/ms/dnsmasq.git/blob - src/forward.c
1 /* dnsmasq is Copyright (c) 2000-2014 Simon Kelley
3 This program is free software; you can redistribute it and/or modify
4 it under the terms of the GNU General Public License as published by
5 the Free Software Foundation; version 2 dated June, 1991, or
6 (at your option) version 3 dated 29 June, 2007.
8 This program is distributed in the hope that it will be useful,
9 but WITHOUT ANY WARRANTY; without even the implied warranty of
10 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 GNU General Public License for more details.
13 You should have received a copy of the GNU General Public License
14 along with this program. If not, see <http://www.gnu.org/licenses/>.
/* Forward declaration of a file-local lookup helper. In this file,
   reply_query() calls it with the id taken from a received reply header
   (converted with ntohs) and the value returned by hash_questions(), and
   tests the returned pointer for null. */
19 static struct frec
*lookup_frec(unsigned short id
, void *hash
);
20 static struct frec
*lookup_frec_by_sender(unsigned short id
,
21 union mysockaddr
*addr
,
/* Forward declarations of file-local helpers used further down. */

/* The return value is stored in a forwarding record's new_id field and then
   written (via htons) into the outgoing header id. */
23 static unsigned short get_id(void);
/* Called on a forwarding record at the points the callers mark "cancel". */
24 static void free_frec(struct frec
*f
);
/* Callers pass AF_INET or AF_INET6, keep the result in the record's
   rfd4/rfd6 field, and treat a null result as failure. */
25 static struct randfd
*allocate_rfd(int family
);
/* NOTE(review): no call site is visible in this excerpt; presumably the TCP
   counterpart of the key-fetching logic in reply_query() - confirm. */
28 static int tcp_key_recurse(time_t now
, int status
, struct dns_header
*header
, size_t n
,
29 int class, char *name
, char *keyname
, struct server
*server
, int *keycount
);
/* reply_query() assigns the result to its validation status when the
   forwarding record has FREC_CHECK_NOSIGN set. */
30 static int do_check_sign(time_t now
, struct dns_header
*header
, size_t plen
, char *name
, char *keyname
, int class);
/* reply_query() calls this, again assigning the result to its validation
   status, when validation returned STAT_NO_SIG and OPT_DNSSEC_NO_SIGN
   is enabled. */
31 static int send_check_sign(time_t now
, struct dns_header
*header
, size_t plen
, char *name
, char *keyname
);
35 /* Send a UDP packet with its source address set as "source"
36 unless nowild is true, when we just send it with the kernel default */
37 int send_from(int fd
, int nowild
, char *packet
, size_t len
,
38 union mysockaddr
*to
, struct all_addr
*source
,
44 struct cmsghdr align
; /* this ensures alignment */
45 #if defined(HAVE_LINUX_NETWORK)
46 char control
[CMSG_SPACE(sizeof(struct in_pktinfo
))];
47 #elif defined(IP_SENDSRCADDR)
48 char control
[CMSG_SPACE(sizeof(struct in_addr
))];
51 char control6
[CMSG_SPACE(sizeof(struct in6_pktinfo
))];
55 iov
[0].iov_base
= packet
;
58 msg
.msg_control
= NULL
;
59 msg
.msg_controllen
= 0;
62 msg
.msg_namelen
= sa_len(to
);
68 struct cmsghdr
*cmptr
;
69 msg
.msg_control
= &control_u
;
70 msg
.msg_controllen
= sizeof(control_u
);
71 cmptr
= CMSG_FIRSTHDR(&msg
);
73 if (to
->sa
.sa_family
== AF_INET
)
75 #if defined(HAVE_LINUX_NETWORK)
78 p
.ipi_spec_dst
= source
->addr
.addr4
;
79 memcpy(CMSG_DATA(cmptr
), &p
, sizeof(p
));
80 msg
.msg_controllen
= cmptr
->cmsg_len
= CMSG_LEN(sizeof(struct in_pktinfo
));
81 cmptr
->cmsg_level
= IPPROTO_IP
;
82 cmptr
->cmsg_type
= IP_PKTINFO
;
83 #elif defined(IP_SENDSRCADDR)
84 memcpy(CMSG_DATA(cmptr
), &(source
->addr
.addr4
), sizeof(source
->addr
.addr4
));
85 msg
.msg_controllen
= cmptr
->cmsg_len
= CMSG_LEN(sizeof(struct in_addr
));
86 cmptr
->cmsg_level
= IPPROTO_IP
;
87 cmptr
->cmsg_type
= IP_SENDSRCADDR
;
94 p
.ipi6_ifindex
= iface
; /* Need iface for IPv6 to handle link-local addrs */
95 p
.ipi6_addr
= source
->addr
.addr6
;
96 memcpy(CMSG_DATA(cmptr
), &p
, sizeof(p
));
97 msg
.msg_controllen
= cmptr
->cmsg_len
= CMSG_LEN(sizeof(struct in6_pktinfo
));
98 cmptr
->cmsg_type
= daemon
->v6pktinfo
;
99 cmptr
->cmsg_level
= IPPROTO_IPV6
;
102 (void)iface
; /* eliminate warning */
106 while (sendmsg(fd
, &msg
, 0) == -1)
111 /* If interface is still in DAD, EINVAL results - ignore that. */
115 my_syslog(LOG_ERR
, _("failed to send packet: %s"), strerror(errno
));
122 static unsigned int search_servers(time_t now
, struct all_addr
**addrpp
,
123 unsigned int qtype
, char *qdomain
, int *type
, char **domain
, int *norebind
)
126 /* If the query ends in the domain in one of our servers, set
127 domain to point to that name. We find the largest match to allow both
128 domain.org and sub.domain.org to exist. */
130 unsigned int namelen
= strlen(qdomain
);
131 unsigned int matchlen
= 0;
133 unsigned int flags
= 0;
135 for (serv
= daemon
->servers
; serv
; serv
=serv
->next
)
136 /* domain matches take priority over NODOTS matches */
137 if ((serv
->flags
& SERV_FOR_NODOTS
) && *type
!= SERV_HAS_DOMAIN
&& !strchr(qdomain
, '.') && namelen
!= 0)
139 unsigned int sflag
= serv
->addr
.sa
.sa_family
== AF_INET
? F_IPV4
: F_IPV6
;
140 *type
= SERV_FOR_NODOTS
;
141 if (serv
->flags
& SERV_NO_ADDR
)
143 else if (serv
->flags
& SERV_LITERAL_ADDRESS
)
148 if (serv
->addr
.sa
.sa_family
== AF_INET
)
149 *addrpp
= (struct all_addr
*)&serv
->addr
.in
.sin_addr
;
152 *addrpp
= (struct all_addr
*)&serv
->addr
.in6
.sin6_addr
;
155 else if (!flags
|| (flags
& F_NXDOMAIN
))
159 else if (serv
->flags
& SERV_HAS_DOMAIN
)
161 unsigned int domainlen
= strlen(serv
->domain
);
162 char *matchstart
= qdomain
+ namelen
- domainlen
;
163 if (namelen
>= domainlen
&&
164 hostname_isequal(matchstart
, serv
->domain
) &&
165 (domainlen
== 0 || namelen
== domainlen
|| *(matchstart
-1) == '.' ))
167 if (serv
->flags
& SERV_NO_REBIND
)
171 unsigned int sflag
= serv
->addr
.sa
.sa_family
== AF_INET
? F_IPV4
: F_IPV6
;
172 /* implement priority rules for --address and --server for same domain.
173 --address wins if the address is for the correct AF
174 --server wins otherwise. */
175 if (domainlen
!= 0 && domainlen
== matchlen
)
177 if ((serv
->flags
& SERV_LITERAL_ADDRESS
))
179 if (!(sflag
& qtype
) && flags
== 0)
184 if (flags
& (F_IPV4
| F_IPV6
))
189 if (domainlen
>= matchlen
)
191 *type
= serv
->flags
& (SERV_HAS_DOMAIN
| SERV_USE_RESOLV
| SERV_NO_REBIND
);
192 *domain
= serv
->domain
;
193 matchlen
= domainlen
;
194 if (serv
->flags
& SERV_NO_ADDR
)
196 else if (serv
->flags
& SERV_LITERAL_ADDRESS
)
201 if (serv
->addr
.sa
.sa_family
== AF_INET
)
202 *addrpp
= (struct all_addr
*)&serv
->addr
.in
.sin_addr
;
205 *addrpp
= (struct all_addr
*)&serv
->addr
.in6
.sin6_addr
;
208 else if (!flags
|| (flags
& F_NXDOMAIN
))
218 if (flags
== 0 && !(qtype
& F_QUERY
) &&
219 option_bool(OPT_NODOTS_LOCAL
) && !strchr(qdomain
, '.') && namelen
!= 0)
220 /* don't forward A or AAAA queries for simple names, except the empty name */
223 if (flags
== F_NXDOMAIN
&& check_for_local_domain(qdomain
, now
))
230 if (flags
== F_NXDOMAIN
|| flags
== F_NOERR
)
231 logflags
= F_NEG
| qtype
;
233 log_query(logflags
| flags
| F_CONFIG
| F_FORWARD
, qdomain
, *addrpp
, NULL
);
235 else if ((*type
) & SERV_USE_RESOLV
)
237 *type
= 0; /* use normal servers for this domain */
243 static int forward_query(int udpfd
, union mysockaddr
*udpaddr
,
244 struct all_addr
*dst_addr
, unsigned int dst_iface
,
245 struct dns_header
*header
, size_t plen
, time_t now
,
246 struct frec
*forward
, int ad_reqd
, int do_bit
)
249 int type
= 0, norebind
= 0;
250 struct all_addr
*addrp
= NULL
;
251 unsigned int flags
= 0;
252 struct server
*start
= NULL
;
254 void *hash
= hash_questions(header
, plen
, daemon
->namebuff
);
256 unsigned int crc
= questions_crc(header
, plen
, daemon
->namebuff
);
259 unsigned int gotname
= extract_request(header
, plen
, daemon
->namebuff
, NULL
);
263 /* may be no servers available. */
264 if (!daemon
->servers
)
266 else if (forward
|| (hash
&& (forward
= lookup_frec_by_sender(ntohs(header
->id
), udpaddr
, hash
))))
269 /* If we've already got an answer to this query, but we're awaiting keys for validation,
270 there's no point retrying the query, retry the key query instead...... */
271 if (forward
->blocking_query
)
275 while (forward
->blocking_query
)
276 forward
= forward
->blocking_query
;
278 blockdata_retrieve(forward
->stash
, forward
->stash_len
, (void *)header
);
279 plen
= forward
->stash_len
;
281 if (forward
->sentto
->addr
.sa
.sa_family
== AF_INET
)
282 log_query(F_DNSSEC
| F_IPV4
, "retry", (struct all_addr
*)&forward
->sentto
->addr
.in
.sin_addr
, "dnssec");
285 log_query(F_DNSSEC
| F_IPV6
, "retry", (struct all_addr
*)&forward
->sentto
->addr
.in6
.sin6_addr
, "dnssec");
288 if (forward
->sentto
->sfd
)
289 fd
= forward
->sentto
->sfd
->fd
;
293 if (forward
->sentto
->addr
.sa
.sa_family
== AF_INET6
)
294 fd
= forward
->rfd6
->fd
;
297 fd
= forward
->rfd4
->fd
;
300 while (sendto(fd
, (char *)header
, plen
, 0,
301 &forward
->sentto
->addr
.sa
,
302 sa_len(&forward
->sentto
->addr
)) == -1 && retry_send());
308 /* retry on existing query, send to all available servers */
309 domain
= forward
->sentto
->domain
;
310 forward
->sentto
->failed_queries
++;
311 if (!option_bool(OPT_ORDER
))
313 forward
->forwardall
= 1;
314 daemon
->last_server
= NULL
;
316 type
= forward
->sentto
->flags
& SERV_TYPE
;
317 if (!(start
= forward
->sentto
->next
))
318 start
= daemon
->servers
; /* at end of list, recycle */
319 header
->id
= htons(forward
->new_id
);
324 flags
= search_servers(now
, &addrp
, gotname
, daemon
->namebuff
, &type
, &domain
, &norebind
);
326 if (!flags
&& !(forward
= get_new_frec(now
, NULL
, 0)))
327 /* table full - server failure. */
332 forward
->source
= *udpaddr
;
333 forward
->dest
= *dst_addr
;
334 forward
->iface
= dst_iface
;
335 forward
->orig_id
= ntohs(header
->id
);
336 forward
->new_id
= get_id();
338 memcpy(forward
->hash
, hash
, HASH_SIZE
);
339 forward
->forwardall
= 0;
342 forward
->flags
|= FREC_NOREBIND
;
343 if (header
->hb4
& HB4_CD
)
344 forward
->flags
|= FREC_CHECKING_DISABLED
;
346 forward
->flags
|= FREC_AD_QUESTION
;
348 forward
->work_counter
= DNSSEC_WORK
;
350 forward
->flags
|= FREC_DO_QUESTION
;
353 header
->id
= htons(forward
->new_id
);
355 /* In strict_order mode, always try servers in the order
356 specified in resolv.conf, if a domain is given
357 always try all the available servers,
358 otherwise, use the one last known to work. */
362 if (option_bool(OPT_ORDER
))
363 start
= daemon
->servers
;
364 else if (!(start
= daemon
->last_server
) ||
365 daemon
->forwardcount
++ > FORWARD_TEST
||
366 difftime(now
, daemon
->forwardtime
) > FORWARD_TIME
)
368 start
= daemon
->servers
;
369 forward
->forwardall
= 1;
370 daemon
->forwardcount
= 0;
371 daemon
->forwardtime
= now
;
376 start
= daemon
->servers
;
377 if (!option_bool(OPT_ORDER
))
378 forward
->forwardall
= 1;
383 /* check for send errors here (no route to host)
384 if we fail to send to all nameservers, send back an error
385 packet straight away (helps modem users when offline) */
387 if (!flags
&& forward
)
389 struct server
*firstsentto
= start
;
392 if (option_bool(OPT_ADD_MAC
))
393 plen
= add_mac(header
, plen
, ((char *) header
) + daemon
->packet_buff_sz
, &forward
->source
);
395 if (option_bool(OPT_CLIENT_SUBNET
))
397 size_t new = add_source_addr(header
, plen
, ((char *) header
) + daemon
->packet_buff_sz
, &forward
->source
);
401 forward
->flags
|= FREC_HAS_SUBNET
;
406 if (option_bool(OPT_DNSSEC_VALID
))
408 size_t new_plen
= add_do_bit(header
, plen
, ((char *) header
) + daemon
->packet_buff_sz
);
410 /* For debugging, set Checking Disabled, otherwise, have the upstream check too,
411 this allows it to select auth servers when one is returning bad data. */
412 if (option_bool(OPT_DNSSEC_DEBUG
))
413 header
->hb4
|= HB4_CD
;
415 if (new_plen
!= plen
)
416 forward
->flags
|= FREC_ADDED_PHEADER
;
424 /* only send to servers dealing with our domain.
425 domain may be NULL, in which case server->domain
426 must be NULL also. */
428 if (type
== (start
->flags
& SERV_TYPE
) &&
429 (type
!= SERV_HAS_DOMAIN
|| hostname_isequal(domain
, start
->domain
)) &&
430 !(start
->flags
& SERV_LITERAL_ADDRESS
))
434 /* find server socket to use, may need to get random one. */
440 if (start
->addr
.sa
.sa_family
== AF_INET6
)
442 if (!forward
->rfd6
&&
443 !(forward
->rfd6
= allocate_rfd(AF_INET6
)))
445 daemon
->rfd_save
= forward
->rfd6
;
446 fd
= forward
->rfd6
->fd
;
451 if (!forward
->rfd4
&&
452 !(forward
->rfd4
= allocate_rfd(AF_INET
)))
454 daemon
->rfd_save
= forward
->rfd4
;
455 fd
= forward
->rfd4
->fd
;
458 #ifdef HAVE_CONNTRACK
459 /* Copy connection mark of incoming query to outgoing connection. */
460 if (option_bool(OPT_CONNTRACK
))
463 if (get_incoming_mark(&forward
->source
, &forward
->dest
, 0, &mark
))
464 setsockopt(fd
, SOL_SOCKET
, SO_MARK
, &mark
, sizeof(unsigned int));
469 if (sendto(fd
, (char *)header
, plen
, 0,
471 sa_len(&start
->addr
)) == -1)
478 /* Keep info in case we want to re-send this packet */
479 daemon
->srv_save
= start
;
480 daemon
->packet_len
= plen
;
483 strcpy(daemon
->namebuff
, "query");
484 if (start
->addr
.sa
.sa_family
== AF_INET
)
485 log_query(F_SERVER
| F_IPV4
| F_FORWARD
, daemon
->namebuff
,
486 (struct all_addr
*)&start
->addr
.in
.sin_addr
, NULL
);
489 log_query(F_SERVER
| F_IPV6
| F_FORWARD
, daemon
->namebuff
,
490 (struct all_addr
*)&start
->addr
.in6
.sin6_addr
, NULL
);
494 forward
->sentto
= start
;
495 if (!forward
->forwardall
)
497 forward
->forwardall
++;
501 if (!(start
= start
->next
))
502 start
= daemon
->servers
;
504 if (start
== firstsentto
)
511 /* could not send on, prepare to return */
512 header
->id
= htons(forward
->orig_id
);
513 free_frec(forward
); /* cancel */
516 /* could not send on, return empty answer or address if known for whole domain */
519 plen
= setup_reply(header
, plen
, addrp
, flags
, daemon
->local_ttl
);
520 send_from(udpfd
, option_bool(OPT_NOWILD
) || option_bool(OPT_CLEVERBIND
), (char *)header
, plen
, udpaddr
, dst_addr
, dst_iface
);
526 static size_t process_reply(struct dns_header
*header
, time_t now
, struct server
*server
, size_t n
, int check_rebind
,
527 int no_cache
, int cache_secure
, int ad_reqd
, int do_bit
, int added_pheader
, int check_subnet
, union mysockaddr
*query_source
)
529 unsigned char *pheader
, *sizep
;
531 int munged
= 0, is_sign
;
538 /* Similar algorithm to search_servers. */
539 struct ipsets
*ipset_pos
;
540 unsigned int namelen
= strlen(daemon
->namebuff
);
541 unsigned int matchlen
= 0;
542 for (ipset_pos
= daemon
->ipsets
; ipset_pos
; ipset_pos
= ipset_pos
->next
)
544 unsigned int domainlen
= strlen(ipset_pos
->domain
);
545 char *matchstart
= daemon
->namebuff
+ namelen
- domainlen
;
546 if (namelen
>= domainlen
&& hostname_isequal(matchstart
, ipset_pos
->domain
) &&
547 (domainlen
== 0 || namelen
== domainlen
|| *(matchstart
- 1) == '.' ) &&
548 domainlen
>= matchlen
)
550 matchlen
= domainlen
;
551 sets
= ipset_pos
->sets
;
556 /* If upstream is advertising a larger UDP packet size
557 than we allow, trim it so that we don't get overlarge
558 requests for the client. We can't do this for signed packets. */
560 if ((pheader
= find_pseudoheader(header
, n
, &plen
, &sizep
, &is_sign
)))
562 unsigned short udpsz
;
563 unsigned char *psave
= sizep
;
565 GETSHORT(udpsz
, sizep
);
567 if (!is_sign
&& udpsz
> daemon
->edns_pktsz
)
568 PUTSHORT(daemon
->edns_pktsz
, psave
);
570 if (check_subnet
&& !check_source(header
, plen
, pheader
, query_source
))
572 my_syslog(LOG_WARNING
, _("discarding DNS reply: subnet option mismatch"));
579 header
->arcount
= htons(0);
583 /* RFC 4035 sect 4.6 para 3 */
584 if (!is_sign
&& !option_bool(OPT_DNSSEC_PROXY
))
585 header
->hb4
&= ~HB4_AD
;
587 if (OPCODE(header
) != QUERY
|| (RCODE(header
) != NOERROR
&& RCODE(header
) != NXDOMAIN
))
590 /* Complain loudly if the upstream server is non-recursive. */
591 if (!(header
->hb4
& HB4_RA
) && RCODE(header
) == NOERROR
&& ntohs(header
->ancount
) == 0 &&
592 server
&& !(server
->flags
& SERV_WARNED_RECURSIVE
))
594 prettyprint_addr(&server
->addr
, daemon
->namebuff
);
595 my_syslog(LOG_WARNING
, _("nameserver %s refused to do a recursive query"), daemon
->namebuff
);
596 if (!option_bool(OPT_LOG
))
597 server
->flags
|= SERV_WARNED_RECURSIVE
;
600 if (daemon
->bogus_addr
&& RCODE(header
) != NXDOMAIN
&&
601 check_for_bogus_wildcard(header
, n
, daemon
->namebuff
, daemon
->bogus_addr
, now
))
604 SET_RCODE(header
, NXDOMAIN
);
605 header
->hb3
&= ~HB3_AA
;
612 if (RCODE(header
) == NXDOMAIN
&&
613 extract_request(header
, n
, daemon
->namebuff
, NULL
) &&
614 check_for_local_domain(daemon
->namebuff
, now
))
616 /* if we forwarded a query for a locally known name (because it was for
617 an unknown type) and the answer is NXDOMAIN, convert that to NODATA,
618 since we know that the domain exists, even if upstream doesn't */
620 header
->hb3
|= HB3_AA
;
621 SET_RCODE(header
, NOERROR
);
625 if (extract_addresses(header
, n
, daemon
->namebuff
, now
, sets
, is_sign
, check_rebind
, no_cache
, cache_secure
, &doctored
))
627 my_syslog(LOG_WARNING
, _("possible DNS-rebind attack detected: %s"), daemon
->namebuff
);
637 if (no_cache
&& !(header
->hb4
& HB4_CD
))
639 if (!option_bool(OPT_DNSSEC_DEBUG
))
641 /* Bogus reply, turn into SERVFAIL */
642 SET_RCODE(header
, SERVFAIL
);
647 if (option_bool(OPT_DNSSEC_VALID
))
648 header
->hb4
&= ~HB4_AD
;
650 if (!(header
->hb4
& HB4_CD
) && ad_reqd
&& cache_secure
)
651 header
->hb4
|= HB4_AD
;
653 /* If the requestor didn't set the DO bit, don't return DNSSEC info. */
655 n
= filter_rrsigs(header
, n
);
658 /* do this after extract_addresses. Ensure NODATA reply and remove
663 header
->ancount
= htons(0);
664 header
->nscount
= htons(0);
665 header
->arcount
= htons(0);
668 /* the bogus-nxdomain stuff, doctor and NXDOMAIN->NODATA munging can all elide
669 sections of the packet. Find the new length here and put back pseudoheader
670 if it was removed. */
671 return resize_packet(header
, n
, pheader
, plen
);
674 /* sets new last_server */
675 void reply_query(int fd
, int family
, time_t now
)
677 /* packet from peer server, extract data for cache, and send to
678 original requester */
679 struct dns_header
*header
;
680 union mysockaddr serveraddr
;
681 struct frec
*forward
;
682 socklen_t addrlen
= sizeof(serveraddr
);
683 ssize_t n
= recvfrom(fd
, daemon
->packet
, daemon
->packet_buff_sz
, 0, &serveraddr
.sa
, &addrlen
);
685 struct server
*server
;
691 /* packet buffer overwritten */
692 daemon
->srv_save
= NULL
;
694 /* Determine the address of the server replying so that we can mark that as good */
695 serveraddr
.sa
.sa_family
= family
;
697 if (serveraddr
.sa
.sa_family
== AF_INET6
)
698 serveraddr
.in6
.sin6_flowinfo
= 0;
701 header
= (struct dns_header
*)daemon
->packet
;
703 if (n
< (int)sizeof(struct dns_header
) || !(header
->hb3
& HB3_QR
))
706 /* spoof check: answer must come from known server, */
707 for (server
= daemon
->servers
; server
; server
= server
->next
)
708 if (!(server
->flags
& (SERV_LITERAL_ADDRESS
| SERV_NO_ADDR
)) &&
709 sockaddr_isequal(&server
->addr
, &serveraddr
))
716 hash
= hash_questions(header
, n
, daemon
->namebuff
);
719 crc
= questions_crc(header
, n
, daemon
->namebuff
);
722 if (!(forward
= lookup_frec(ntohs(header
->id
), hash
)))
725 if ((RCODE(header
) == SERVFAIL
|| RCODE(header
) == REFUSED
) &&
726 !option_bool(OPT_ORDER
) &&
727 forward
->forwardall
== 0)
728 /* for broken servers, attempt to send to another one. */
730 unsigned char *pheader
;
734 /* recreate query from reply */
735 pheader
= find_pseudoheader(header
, (size_t)n
, &plen
, NULL
, &is_sign
);
738 header
->ancount
= htons(0);
739 header
->nscount
= htons(0);
740 header
->arcount
= htons(0);
741 if ((nn
= resize_packet(header
, (size_t)n
, pheader
, plen
)))
743 header
->hb3
&= ~(HB3_QR
| HB3_TC
);
744 forward_query(-1, NULL
, NULL
, 0, header
, nn
, now
, forward
, 0, 0);
750 server
= forward
->sentto
;
752 if ((forward
->sentto
->flags
& SERV_TYPE
) == 0)
754 if (RCODE(header
) == SERVFAIL
|| RCODE(header
) == REFUSED
)
758 struct server
*last_server
;
760 /* find good server by address if possible, otherwise assume the last one we sent to */
761 for (last_server
= daemon
->servers
; last_server
; last_server
= last_server
->next
)
762 if (!(last_server
->flags
& (SERV_LITERAL_ADDRESS
| SERV_HAS_DOMAIN
| SERV_FOR_NODOTS
| SERV_NO_ADDR
)) &&
763 sockaddr_isequal(&last_server
->addr
, &serveraddr
))
765 server
= last_server
;
769 if (!option_bool(OPT_ALL_SERVERS
))
770 daemon
->last_server
= server
;
773 /* If the answer is an error, keep the forward record in place in case
774 we get a good reply from another server. Kill it when we've
775 had replies from all to avoid filling the forwarding table when
776 everything is broken */
777 if (forward
->forwardall
== 0 || --forward
->forwardall
== 1 ||
778 (RCODE(header
) != REFUSED
&& RCODE(header
) != SERVFAIL
))
780 int check_rebind
= 0, no_cache_dnssec
= 0, cache_secure
= 0;
782 if (option_bool(OPT_NO_REBIND
))
783 check_rebind
= !(forward
->flags
& FREC_NOREBIND
);
785 /* Don't cache replies where DNSSEC validation was turned off, either
786 the upstream server told us so, or the original query specified it. */
787 if ((header
->hb4
& HB4_CD
) || (forward
->flags
& FREC_CHECKING_DISABLED
))
791 if (option_bool(OPT_DNSSEC_VALID
) && !(forward
->flags
& FREC_CHECKING_DISABLED
))
795 /* We've had a reply already, which we're validating. Ignore this duplicate */
796 if (forward
->blocking_query
)
799 if (header
->hb3
& HB3_TC
)
801 /* Truncated answer can't be validated.
802 If this is an answer to a DNSSEC-generated query, we still
803 need to get the client to retry over TCP, so return
804 an answer with the TC bit set, even if the actual answer fits.
806 status
= STAT_TRUNCATED
;
808 else if (forward
->flags
& FREC_DNSKEY_QUERY
)
809 status
= dnssec_validate_by_ds(now
, header
, n
, daemon
->namebuff
, daemon
->keyname
, forward
->class);
810 else if (forward
->flags
& FREC_DS_QUERY
)
812 status
= dnssec_validate_ds(now
, header
, n
, daemon
->namebuff
, daemon
->keyname
, forward
->class);
813 if (status
== STAT_NO_DS
)
814 status
= STAT_INSECURE
;
816 else if (forward
->flags
& FREC_CHECK_NOSIGN
)
817 status
= do_check_sign(now
, header
, n
, daemon
->namebuff
, daemon
->keyname
, forward
->class);
820 status
= dnssec_validate_reply(now
, header
, n
, daemon
->namebuff
, daemon
->keyname
, &forward
->class, NULL
);
821 if (status
== STAT_NO_SIG
)
823 if (option_bool(OPT_DNSSEC_NO_SIGN
))
824 status
= send_check_sign(now
, header
, n
, daemon
->namebuff
, daemon
->keyname
);
826 status
= STAT_INSECURE
;
829 /* Can't validate, as we're missing key data. Put this
830 answer aside, whilst we get that. */
831 if (status
== STAT_NEED_DS
|| status
== STAT_NEED_DS_NEG
|| status
== STAT_NEED_KEY
)
833 struct frec
*new, *orig
;
835 /* Free any saved query */
837 blockdata_free(forward
->stash
);
839 /* Now save reply pending receipt of key data */
840 if (!(forward
->stash
= blockdata_alloc((char *)header
, n
)))
842 forward
->stash_len
= n
;
845 /* Find the original query that started it all.... */
846 for (orig
= forward
; orig
->dependent
; orig
= orig
->dependent
);
848 if (--orig
->work_counter
== 0 || !(new = get_new_frec(now
, NULL
, 1)))
849 status
= STAT_INSECURE
;
853 struct frec
*next
= new->next
;
854 *new = *forward
; /* copy everything, then overwrite */
856 new->blocking_query
= NULL
;
861 new->flags
&= ~(FREC_DNSKEY_QUERY
| FREC_DS_QUERY
| FREC_CHECK_NOSIGN
);
863 new->dependent
= forward
; /* to find query awaiting new one. */
864 forward
->blocking_query
= new; /* for garbage cleaning */
865 /* validate routines leave name of required record in daemon->keyname */
866 if (status
== STAT_NEED_KEY
)
868 new->flags
|= FREC_DNSKEY_QUERY
;
869 nn
= dnssec_generate_query(header
, ((char *) header
) + daemon
->packet_buff_sz
,
870 daemon
->keyname
, forward
->class, T_DNSKEY
, &server
->addr
);
874 if (status
== STAT_NEED_DS_NEG
)
875 new->flags
|= FREC_CHECK_NOSIGN
;
877 new->flags
|= FREC_DS_QUERY
;
878 nn
= dnssec_generate_query(header
,((char *) header
) + daemon
->packet_buff_sz
,
879 daemon
->keyname
, forward
->class, T_DS
, &server
->addr
);
881 if ((hash
= hash_questions(header
, nn
, daemon
->namebuff
)))
882 memcpy(new->hash
, hash
, HASH_SIZE
);
883 new->new_id
= get_id();
884 header
->id
= htons(new->new_id
);
885 /* Save query for retransmission */
886 new->stash
= blockdata_alloc((char *)header
, nn
);
889 /* Don't resend this. */
890 daemon
->srv_save
= NULL
;
893 fd
= server
->sfd
->fd
;
898 if (server
->addr
.sa
.sa_family
== AF_INET6
)
900 if (new->rfd6
|| (new->rfd6
= allocate_rfd(AF_INET6
)))
906 if (new->rfd4
|| (new->rfd4
= allocate_rfd(AF_INET
)))
913 while (sendto(fd
, (char *)header
, nn
, 0, &server
->addr
.sa
, sa_len(&server
->addr
)) == -1 && retry_send());
921 /* Ok, we reached far enough up the chain-of-trust that we can validate something.
922 Now wind back down, pulling back answers which wouldn't previously validate
923 and validate them with the new data. Note that if an answer needs multiple
924 keys to validate, we may find another key is needed, in which case we set off
925 down another branch of the tree. Once we get to the original answer
926 (FREC_DNSSEC_QUERY not set) and it validates, return it to the original requestor. */
927 while (forward
->dependent
)
929 struct frec
*prev
= forward
->dependent
;
932 forward
->blocking_query
= NULL
; /* already gone */
933 blockdata_retrieve(forward
->stash
, forward
->stash_len
, (void *)header
);
934 n
= forward
->stash_len
;
936 if (status
== STAT_SECURE
)
938 if (forward
->flags
& FREC_DNSKEY_QUERY
)
939 status
= dnssec_validate_by_ds(now
, header
, n
, daemon
->namebuff
, daemon
->keyname
, forward
->class);
940 else if (forward
->flags
& FREC_DS_QUERY
)
942 status
= dnssec_validate_ds(now
, header
, n
, daemon
->namebuff
, daemon
->keyname
, forward
->class);
943 if (status
== STAT_NO_DS
)
944 status
= STAT_INSECURE
;
946 else if (forward
->flags
& FREC_CHECK_NOSIGN
)
947 status
= do_check_sign(now
, header
, n
, daemon
->namebuff
, daemon
->keyname
, forward
->class);
950 status
= dnssec_validate_reply(now
, header
, n
, daemon
->namebuff
, daemon
->keyname
, &forward
->class, NULL
);
951 if (status
== STAT_NO_SIG
)
953 if (option_bool(OPT_DNSSEC_NO_SIGN
))
954 status
= send_check_sign(now
, header
, n
, daemon
->namebuff
, daemon
->keyname
);
956 status
= STAT_INSECURE
;
960 if (status
== STAT_NEED_DS
|| status
== STAT_NEED_DS_NEG
|| status
== STAT_NEED_KEY
)
965 if (status
== STAT_TRUNCATED
)
966 header
->hb3
|= HB3_TC
;
971 if (forward
->work_counter
== 0)
972 result
= "ABANDONED";
974 result
= (status
== STAT_SECURE
? "SECURE" : (status
== STAT_INSECURE
? "INSECURE" : "BOGUS"));
976 log_query(F_KEYTAG
| F_SECSTAT
, "result", NULL
, result
);
981 if (status
== STAT_SECURE
)
983 else if (status
== STAT_BOGUS
)
988 /* restore CD bit to the value in the query */
989 if (forward
->flags
& FREC_CHECKING_DISABLED
)
990 header
->hb4
|= HB4_CD
;
992 header
->hb4
&= ~HB4_CD
;
994 if ((nn
= process_reply(header
, now
, server
, (size_t)n
, check_rebind
, no_cache_dnssec
, cache_secure
,
995 forward
->flags
& FREC_AD_QUESTION
, forward
->flags
& FREC_DO_QUESTION
,
996 forward
->flags
& FREC_ADDED_PHEADER
, forward
->flags
& FREC_HAS_SUBNET
, &forward
->source
)))
998 header
->id
= htons(forward
->orig_id
);
999 header
->hb4
|= HB4_RA
; /* recursion if available */
1000 send_from(forward
->fd
, option_bool(OPT_NOWILD
) || option_bool (OPT_CLEVERBIND
), daemon
->packet
, nn
,
1001 &forward
->source
, &forward
->dest
, forward
->iface
);
1003 free_frec(forward
); /* cancel */
1008 void receive_query(struct listener
*listen
, time_t now
)
1010 struct dns_header
*header
= (struct dns_header
*)daemon
->packet
;
1011 union mysockaddr source_addr
;
1012 unsigned short type
;
1013 struct all_addr dst_addr
;
1014 struct in_addr netmask
, dst_addr_4
;
1017 int if_index
= 0, auth_dns
= 0;
1021 struct iovec iov
[1];
1023 struct cmsghdr
*cmptr
;
1025 struct cmsghdr align
; /* this ensures alignment */
1027 char control6
[CMSG_SPACE(sizeof(struct in6_pktinfo
))];
1029 #if defined(HAVE_LINUX_NETWORK)
1030 char control
[CMSG_SPACE(sizeof(struct in_pktinfo
))];
1031 #elif defined(IP_RECVDSTADDR) && defined(HAVE_SOLARIS_NETWORK)
1032 char control
[CMSG_SPACE(sizeof(struct in_addr
)) +
1033 CMSG_SPACE(sizeof(unsigned int))];
1034 #elif defined(IP_RECVDSTADDR)
1035 char control
[CMSG_SPACE(sizeof(struct in_addr
)) +
1036 CMSG_SPACE(sizeof(struct sockaddr_dl
))];
1040 /* Can always get recvd interface for IPv6 */
1041 int check_dst
= !option_bool(OPT_NOWILD
) || listen
->family
== AF_INET6
;
1043 int check_dst
= !option_bool(OPT_NOWILD
);
1046 /* packet buffer overwritten */
1047 daemon
->srv_save
= NULL
;
1049 dst_addr_4
.s_addr
= 0;
1052 if (option_bool(OPT_NOWILD
) && listen
->iface
)
1054 auth_dns
= listen
->iface
->dns_auth
;
1056 if (listen
->family
== AF_INET
)
1058 dst_addr_4
= listen
->iface
->addr
.in
.sin_addr
;
1059 netmask
= listen
->iface
->netmask
;
1063 iov
[0].iov_base
= daemon
->packet
;
1064 iov
[0].iov_len
= daemon
->edns_pktsz
;
1066 msg
.msg_control
= control_u
.control
;
1067 msg
.msg_controllen
= sizeof(control_u
);
1069 msg
.msg_name
= &source_addr
;
1070 msg
.msg_namelen
= sizeof(source_addr
);
1074 if ((n
= recvmsg(listen
->fd
, &msg
, 0)) == -1)
1077 if (n
< (int)sizeof(struct dns_header
) ||
1078 (msg
.msg_flags
& MSG_TRUNC
) ||
1079 (header
->hb3
& HB3_QR
))
1082 source_addr
.sa
.sa_family
= listen
->family
;
1084 if (listen
->family
== AF_INET
)
1086 /* Source-port == 0 is an error, we can't send back to that.
1087 http://www.ietf.org/mail-archive/web/dnsop/current/msg11441.html */
1088 if (source_addr
.in
.sin_port
== 0)
1094 /* Source-port == 0 is an error, we can't send back to that. */
1095 if (source_addr
.in6
.sin6_port
== 0)
1097 source_addr
.in6
.sin6_flowinfo
= 0;
1101 /* We can be configured to only accept queries from at-most-one-hop-away addresses. */
1102 if (option_bool(OPT_LOCAL_SERVICE
))
1104 struct addrlist
*addr
;
1106 if (listen
->family
== AF_INET6
)
1108 for (addr
= daemon
->interface_addrs
; addr
; addr
= addr
->next
)
1109 if ((addr
->flags
& ADDRLIST_IPV6
) &&
1110 is_same_net6(&addr
->addr
.addr
.addr6
, &source_addr
.in6
.sin6_addr
, addr
->prefixlen
))
1116 struct in_addr netmask
;
1117 for (addr
= daemon
->interface_addrs
; addr
; addr
= addr
->next
)
1119 netmask
.s_addr
= 0xffffffff << (32 - addr
->prefixlen
);
1120 if (!(addr
->flags
& ADDRLIST_IPV6
) &&
1121 is_same_net(addr
->addr
.addr
.addr4
, source_addr
.in
.sin_addr
, netmask
))
1127 static int warned
= 0;
1130 my_syslog(LOG_WARNING
, _("Ignoring query from non-local network"));
1141 if (msg
.msg_controllen
< sizeof(struct cmsghdr
))
1144 #if defined(HAVE_LINUX_NETWORK)
1145 if (listen
->family
== AF_INET
)
1146 for (cmptr
= CMSG_FIRSTHDR(&msg
); cmptr
; cmptr
= CMSG_NXTHDR(&msg
, cmptr
))
1147 if (cmptr
->cmsg_level
== IPPROTO_IP
&& cmptr
->cmsg_type
== IP_PKTINFO
)
1151 struct in_pktinfo
*p
;
1153 p
.c
= CMSG_DATA(cmptr
);
1154 dst_addr_4
= dst_addr
.addr
.addr4
= p
.p
->ipi_spec_dst
;
1155 if_index
= p
.p
->ipi_ifindex
;
1157 #elif defined(IP_RECVDSTADDR) && defined(IP_RECVIF)
1158 if (listen
->family
== AF_INET
)
1160 for (cmptr
= CMSG_FIRSTHDR(&msg
); cmptr
; cmptr
= CMSG_NXTHDR(&msg
, cmptr
))
1166 #ifndef HAVE_SOLARIS_NETWORK
1167 struct sockaddr_dl
*s
;
1170 p
.c
= CMSG_DATA(cmptr
);
1171 if (cmptr
->cmsg_level
== IPPROTO_IP
&& cmptr
->cmsg_type
== IP_RECVDSTADDR
)
1172 dst_addr_4
= dst_addr
.addr
.addr4
= *(p
.a
);
1173 else if (cmptr
->cmsg_level
== IPPROTO_IP
&& cmptr
->cmsg_type
== IP_RECVIF
)
1174 #ifdef HAVE_SOLARIS_NETWORK
1177 if_index
= p
.s
->sdl_index
;
1184 if (listen
->family
== AF_INET6
)
1186 for (cmptr
= CMSG_FIRSTHDR(&msg
); cmptr
; cmptr
= CMSG_NXTHDR(&msg
, cmptr
))
1187 if (cmptr
->cmsg_level
== IPPROTO_IPV6
&& cmptr
->cmsg_type
== daemon
->v6pktinfo
)
1191 struct in6_pktinfo
*p
;
1193 p
.c
= CMSG_DATA(cmptr
);
1195 dst_addr
.addr
.addr6
= p
.p
->ipi6_addr
;
1196 if_index
= p
.p
->ipi6_ifindex
;
1201 /* enforce available interface configuration */
1203 if (!indextoname(listen
->fd
, if_index
, ifr
.ifr_name
))
1206 if (!iface_check(listen
->family
, &dst_addr
, ifr
.ifr_name
, &auth_dns
))
1208 if (!option_bool(OPT_CLEVERBIND
))
1209 enumerate_interfaces(0);
1210 if (!loopback_exception(listen
->fd
, listen
->family
, &dst_addr
, ifr
.ifr_name
) &&
1211 !label_exception(if_index
, listen
->family
, &dst_addr
))
1215 if (listen
->family
== AF_INET
&& option_bool(OPT_LOCALISE
))
1219 /* get the netmask of the interface which has the address we were sent to.
1220 This is not necessarily the interface we arrived on. */
1222 for (iface
= daemon
->interfaces
; iface
; iface
= iface
->next
)
1223 if (iface
->addr
.sa
.sa_family
== AF_INET
&&
1224 iface
->addr
.in
.sin_addr
.s_addr
== dst_addr_4
.s_addr
)
1227 /* interface may be new */
1228 if (!iface
&& !option_bool(OPT_CLEVERBIND
))
1229 enumerate_interfaces(0);
1231 for (iface
= daemon
->interfaces
; iface
; iface
= iface
->next
)
1232 if (iface
->addr
.sa
.sa_family
== AF_INET
&&
1233 iface
->addr
.in
.sin_addr
.s_addr
== dst_addr_4
.s_addr
)
1236 /* If we failed, abandon localisation */
1238 netmask
= iface
->netmask
;
1240 dst_addr_4
.s_addr
= 0;
1244 if (extract_request(header
, (size_t)n
, daemon
->namebuff
, &type
))
1247 struct auth_zone
*zone
;
1249 char *types
= querystr(auth_dns
? "auth" : "query", type
);
1251 if (listen
->family
== AF_INET
)
1252 log_query(F_QUERY
| F_IPV4
| F_FORWARD
, daemon
->namebuff
,
1253 (struct all_addr
*)&source_addr
.in
.sin_addr
, types
);
1256 log_query(F_QUERY
| F_IPV6
| F_FORWARD
, daemon
->namebuff
,
1257 (struct all_addr
*)&source_addr
.in6
.sin6_addr
, types
);
1261 /* find queries for zones we're authoritative for, and answer them directly */
1263 for (zone
= daemon
->auth_zones
; zone
; zone
= zone
->next
)
1264 if (in_zone(zone
, daemon
->namebuff
, NULL
))
1276 m
= answer_auth(header
, ((char *) header
) + daemon
->packet_buff_sz
, (size_t)n
, now
, &source_addr
, local_auth
);
1279 send_from(listen
->fd
, option_bool(OPT_NOWILD
) || option_bool(OPT_CLEVERBIND
),
1280 (char *)header
, m
, &source_addr
, &dst_addr
, if_index
);
1281 daemon
->auth_answer
++;
1287 int ad_reqd
, do_bit
;
1288 m
= answer_request(header
, ((char *) header
) + daemon
->packet_buff_sz
, (size_t)n
,
1289 dst_addr_4
, netmask
, now
, &ad_reqd
, &do_bit
);
1293 send_from(listen
->fd
, option_bool(OPT_NOWILD
) || option_bool(OPT_CLEVERBIND
),
1294 (char *)header
, m
, &source_addr
, &dst_addr
, if_index
);
1295 daemon
->local_answer
++;
1297 else if (forward_query(listen
->fd
, &source_addr
, &dst_addr
, if_index
,
1298 header
, (size_t)n
, now
, NULL
, ad_reqd
, do_bit
))
1299 daemon
->queries_forwarded
++;
1301 daemon
->local_answer
++;
1307 /* UDP: we've got an unsigned answer, return STAT_INSECURE if we can prove there's no DS
1308 and therefore the answer shouldn't be signed, or STAT_BOGUS if it should be, or
1309 STAT_NEED_DS_NEG and keyname if we need to do the query. */
/* Parameters:
     now     - current time; handed to dnssec_chase_cname() and cache_find_by_name().
     header  - the reply being examined; plen is passed with it (presumably its length).
     name    - name workspace; the DS search starts from here (name_start).
     keyname - on a STAT_NEED_DS_NEG return, receives the name to query for.
   NOTE(review): this listing omits lines of the original file (the embedded line
   numbers skip), so the enclosing loop and some return statements are not visible. */
1310 static int send_check_sign(time_t now
, struct dns_header
*header
, size_t plen
, char *name
, char *keyname
)
1313 char *name_start
= name
;
1314 int status
= dnssec_chase_cname(now
, header
, plen
, name
, keyname
);
/* Anything other than STAT_INSECURE from the CNAME chase is treated separately
   (the body of this test is not visible in this listing). */
1316 if (status
!= STAT_INSECURE
)
/* Look in the cache for a DS record at the current candidate name. */
1321 crecp
= cache_find_by_name(NULL
, name_start
, now
, F_DS
);
/* A cached entry flagged F_DNSSECOK decides the outcome: a negative entry (F_NEG)
   gives STAT_INSECURE, a positive one gives STAT_BOGUS. */
1323 if (crecp
&& (crecp
->flags
& F_DNSSECOK
))
1324 return (crecp
->flags
& F_NEG
) ? STAT_INSECURE
: STAT_BOGUS
;
/* A negative entry without F_DNSSECOK: move name_start to just past the next '.',
   provided there is one. */
1326 if (crecp
&& (crecp
->flags
& F_NEG
) && (name_start
= strchr(name_start
, '.')))
1328 name_start
++; /* chop a label off and try again */
/* Hand the name to be queried back to the caller in keyname. */
1332 strcpy(keyname
, name_start
);
1333 return STAT_NEED_DS_NEG
;
1337 /* Got answer to DS query from send_check_sign, check for proven non-existence, or make the next DS query to try. */
/* Parameters:
     now, header, plen, name, keyname, class - all forwarded to dnssec_validate_ds().
     name    - also reused as the buffer extract_name() writes the query name into.
     keyname - on a STAT_NEED_DS_NEG return, receives the next name to query for.
   NOTE(review): this listing omits lines of the original file (the embedded line
   numbers skip), so local declarations and some return statements are not visible. */
1338 static int do_check_sign(time_t now
, struct dns_header
*header
, size_t plen
, char *name
, char *keyname
, int class)
1343 int status
= dnssec_validate_ds(now
, header
, plen
, name
, keyname
, class);
1345 if (status
!= STAT_INSECURE
)
/* STAT_NO_DS is mapped to STAT_INSECURE here. */
1347 if (status
== STAT_NO_DS
)
1348 status
= STAT_INSECURE
;
/* p points at the first byte after the fixed DNS header, from where
   extract_name() reads a name into "name". */
1352 p
= (unsigned char *)(header
+1);
/* If a name was extracted and it contains a '.', the part after the first '.'
   becomes the next name to ask about. */
1354 if (extract_name(header
, plen
, &p
, name
, 1, 4) &&
1355 (name_start
= strchr(name
, '.')))
1357 name_start
++; /* chop a label off and try again */
1358 strcpy(keyname
, name_start
);
1359 return STAT_NEED_DS_NEG
;
1365 /* Move toward the root, until we find a signed non-existence of a DS, in which case
1366 an unsigned answer is OK, or we find a signed DS, in which case there should be
1367 a signature, and the answer is BOGUS */
/* Works over server->tcpfd: builds T_DS queries with dnssec_generate_query(),
   exchanges them with read_write() and validates each reply through
   tcp_key_recurse(..., STAT_NEED_DS_NEG, ...).
   Parameters:
     header/plen - the reply under test; header is re-pointed at a locally
                   allocated buffer after the CNAME chase.
     class       - passed to the generated DS queries and to tcp_key_recurse().
     name        - name workspace; the search starts from here (name_start).
     keyname     - key-name workspace handed on to tcp_key_recurse().
     server      - upstream server; its tcpfd and addr are used.
     keycount    - shared work budget; decremented and tested against zero here.
   NOTE(review): this listing omits lines of the original file (the embedded line
   numbers skip), so the loop structure, the release of "packet" and several
   return statements are not visible. */
1368 static int tcp_check_for_unsigned_zone(time_t now
, struct dns_header
*header
, size_t plen
, int class, char *name
,
1369 char *keyname
, struct server
*server
, int *keycount
)
1372 unsigned char *packet
, *payload
;
1374 unsigned char *p
= (unsigned char *)(header
+1);
1376 char *name_start
= name
;
1378 /* Get first insecure entry in CNAME chain */
1379 status
= tcp_key_recurse(now
, STAT_CHASE_CNAME
, header
, plen
, class, name
, keyname
, server
, keycount
);
1380 if (status
== STAT_BOGUS
)
/* Scratch buffer for the DS exchanges: a 16-bit length word at packet[0..1]
   followed by the DNS message at payload (= &packet[2]). From here on "header"
   refers to this buffer, not to the caller's packet. */
1383 if (!(packet
= whine_malloc(65536 + MAXDNAME
+ RRFIXEDSZ
+ sizeof(u16
))))
1386 payload
= &packet
[2];
1387 header
= (struct dns_header
*)payload
;
1388 length
= (u16
*)packet
;
1392 unsigned char *newhash
, hash
[HASH_SIZE
];
1393 unsigned char c1
, c2
;
1394 struct crec
*crecp
= cache_find_by_name(NULL
, name_start
, now
, F_DS
);
/* Work limit shared with tcp_key_recurse(). */
1396 if (--(*keycount
) == 0)
/* A cached DS entry flagged F_DNSSECOK decides the outcome: negative (F_NEG)
   gives STAT_INSECURE, positive gives STAT_BOGUS. */
1402 if (crecp
&& (crecp
->flags
& F_DNSSECOK
))
1405 return (crecp
->flags
& F_NEG
) ? STAT_INSECURE
: STAT_BOGUS
;
1408 /* If we have cached insecurely that a DS doesn't exist,
1409 use that as a hint for where to start looking for the secure one */
1410 if (crecp
&& (crecp
->flags
& F_NEG
) && (name_start
= strchr(name_start
, '.')))
1412 name_start
++; /* chop a label off and try again */
/* Build a T_DS query for name_start in the scratch buffer; the limit passed is
   65536 bytes past the start of the message. */
1416 m
= dnssec_generate_query(header
, ((char *) header
) + 65536, name_start
, class, T_DS
, &server
->addr
);
1418 /* We rely on the question section coming back unchanged, ensure it is with the hash. */
1419 if ((newhash
= hash_questions(header
, (unsigned int)m
, name
)))
1420 memcpy(hash
, newhash
, HASH_SIZE
);
/* Exchange with the server: the length word plus m bytes of query, then two
   bytes (c1 high, c2 low) giving the reply size, then that many bytes into
   payload. read_write() gets 0 as its last argument on the first call and 1 on
   the others (presumably write versus read). */
1424 if (read_write(server
->tcpfd
, packet
, m
+ sizeof(u16
), 0) &&
1425 read_write(server
->tcpfd
, &c1
, 1, 1) &&
1426 read_write(server
->tcpfd
, &c2
, 1, 1) &&
1427 read_write(server
->tcpfd
, payload
, (c1
<< 8) | c2
, 1))
/* Only carry on if the question hash of the reply matches the one saved above. */
1431 newhash
= hash_questions(header
, (unsigned int)m
, name
);
1432 if (newhash
&& memcmp(hash
, newhash
, HASH_SIZE
) == 0)
1434 /* Note this trashes all three name workspaces */
1435 status
= tcp_key_recurse(now
, STAT_NEED_DS_NEG
, header
, m
, class, name
, keyname
, server
, keycount
);
1437 /* We've found a DS which proves the bit of the DNS where the
1438 original query is, is unsigned, so the answer is OK,
1440 if (status
== STAT_NO_DS
)
1443 return STAT_INSECURE
;
1446 /* No DS, not got to DNSSEC-land yet, go up. */
1447 if (status
== STAT_INSECURE
)
/* Re-read the query name from the reply and, if it still contains a '.',
   continue from the part after the first '.'. */
1449 p
= (unsigned char *)(header
+1);
1451 if (extract_name(header
, plen
, &p
, name
, 1, 4) &&
1452 (name_start
= strchr(name
, '.')))
1454 name_start
++; /* chop a label off and try again */
/* Validate a packet received over TCP, fetching any DNSKEY or DS records that
   validation asks for from "server" (over server->tcpfd) and recursing on them.
   "status" selects how the packet in header/n is validated:
     STAT_NEED_KEY                    -> dnssec_validate_by_ds()
     STAT_NEED_DS / STAT_NEED_DS_NEG  -> dnssec_validate_ds()
     STAT_CHASE_CNAME                 -> dnssec_chase_cname()
     otherwise (presumably; the "else" line is not visible) -> dnssec_validate_reply()
   Other parameters:
     class    - DNS class; dnssec_validate_reply() is given its address.
     name, keyname - name workspaces shared with the validation routines; keyname
                is the name used for the generated DNSKEY/DS query.
     keycount - shared work budget; decremented on entry, STAT_INSECURE is
                returned when it reaches zero.
   NOTE(review): this listing omits lines of the original file (the embedded line
   numbers skip), so some conditions, the release of "packet", the
   another_tcp_key label and the final return are not visible. */
1467 static int tcp_key_recurse(time_t now
, int status
, struct dns_header
*header
, size_t n
,
1468 int class, char *name
, char *keyname
, struct server
*server
, int *keycount
)
1470 /* Recurse up the key hierarchy */
1473 /* limit the amount of work we do, to avoid cycling forever on loops in the DNS */
1474 if (--(*keycount
) == 0)
1475 return STAT_INSECURE
;
1477 if (status
== STAT_NEED_KEY
)
1478 new_status
= dnssec_validate_by_ds(now
, header
, n
, name
, keyname
, class);
1479 else if (status
== STAT_NEED_DS
|| status
== STAT_NEED_DS_NEG
)
1481 new_status
= dnssec_validate_ds(now
, header
, n
, name
, keyname
, class);
/* Only for STAT_NEED_DS is a STAT_NO_DS result turned into STAT_INSECURE;
   with STAT_NEED_DS_NEG the STAT_NO_DS value is left as is. */
1482 if (status
== STAT_NEED_DS
&& new_status
== STAT_NO_DS
)
1483 new_status
= STAT_INSECURE
;
1485 else if (status
== STAT_CHASE_CNAME
)
1486 new_status
= dnssec_chase_cname(now
, header
, n
, name
, keyname
);
1489 new_status
= dnssec_validate_reply(now
, header
, n
, name
, keyname
, &class, NULL
);
/* Unsigned answer: with OPT_DNSSEC_NO_SIGN set, go and check whether the zone
   is provably unsigned; the assignment at 1496 is the alternative (its "else"
   line is not visible). */
1491 if (new_status
== STAT_NO_SIG
)
1493 if (option_bool(OPT_DNSSEC_NO_SIGN
))
1494 new_status
= tcp_check_for_unsigned_zone(now
, header
, n
, class, name
, keyname
, server
, keycount
);
1496 new_status
= STAT_INSECURE
;
1500 /* Can't validate because we need a key/DS whose name now in keyname.
1501 Make query for same, and recurse to validate */
1502 if (new_status
== STAT_NEED_DS
|| new_status
== STAT_NEED_KEY
)
/* Scratch buffer for the sub-query: 16-bit length word at packet[0..1], DNS
   message at payload (= &packet[2]).
   NOTE(review): the test guarding the "return STAT_INSECURE" at 1512 is not
   visible; presumably it is the allocation-failure check. */
1505 unsigned char *packet
= whine_malloc(65536 + MAXDNAME
+ RRFIXEDSZ
+ sizeof(u16
));
1506 unsigned char *payload
= &packet
[2];
1507 struct dns_header
*new_header
= (struct dns_header
*)payload
;
1508 u16
*length
= (u16
*)packet
;
1509 unsigned char c1
, c2
;
1512 return STAT_INSECURE
;
/* Ask for a DNSKEY when a key is needed, otherwise for a DS, at keyname. */
1515 m
= dnssec_generate_query(new_header
, ((char *) new_header
) + 65536, keyname
, class,
1516 new_status
== STAT_NEED_KEY
? T_DNSKEY
: T_DS
, &server
->addr
);
/* Exchange with the server: length word plus m bytes of query, then two bytes
   (c1 high, c2 low) giving the reply size, then that many bytes into payload.
   Any failure makes the result STAT_INSECURE. */
1520 if (!read_write(server
->tcpfd
, packet
, m
+ sizeof(u16
), 0) ||
1521 !read_write(server
->tcpfd
, &c1
, 1, 1) ||
1522 !read_write(server
->tcpfd
, &c2
, 1, 1) ||
1523 !read_write(server
->tcpfd
, payload
, (c1
<< 8) | c2
, 1))
1524 new_status
= STAT_INSECURE
;
/* Validate the fetched key/DS reply itself, recursively. */
1529 new_status
= tcp_key_recurse(now
, new_status
, new_header
, m
, class, name
, keyname
, server
, keycount
);
1531 if (new_status
== STAT_SECURE
)
1533 /* Reached a validated record, now try again at this level.
1534 Note that we may get ANOTHER NEED_* if an answer needs more than one key.
1535 If so, go round again. */
/* Same dispatch on "status" as at the top of the function, applied again to
   the original header/n. */
1537 if (status
== STAT_NEED_KEY
)
1538 new_status
= dnssec_validate_by_ds(now
, header
, n
, name
, keyname
, class);
1539 else if (status
== STAT_NEED_DS
|| status
== STAT_NEED_DS_NEG
)
1541 new_status
= dnssec_validate_ds(now
, header
, n
, name
, keyname
, class);
1542 if (status
== STAT_NEED_DS
&& new_status
== STAT_NO_DS
)
1543 new_status
= STAT_INSECURE
; /* Validated no DS */
1545 else if (status
== STAT_CHASE_CNAME
)
1546 new_status
= dnssec_chase_cname(now
, header
, n
, name
, keyname
);
1549 new_status
= dnssec_validate_reply(now
, header
, n
, name
, keyname
, &class, NULL
);
1551 if (new_status
== STAT_NO_SIG
)
1553 if (option_bool(OPT_DNSSEC_NO_SIGN
))
1554 new_status
= tcp_check_for_unsigned_zone(now
, header
, n
, class, name
, keyname
, server
, keycount
);
1556 new_status
= STAT_INSECURE
;
/* Another key or DS is still needed: jump back to fetch it (the
   another_tcp_key label itself is not visible in this listing). */
1560 if (new_status
== STAT_NEED_DS
|| new_status
== STAT_NEED_KEY
)
1561 goto another_tcp_key
;
1572 /* The daemon forks before calling this: it should deal with one connection,
1573 blocking as necessary, and then return. Note, need to be a bit careful
1574 about resources for debug mode, when the fork is suppressed: that's
1575 done by the caller. */
/* Parameters:
     confd      - the accepted client connection; queries are read from it and
                  replies written to it with read_write().
     now        - current time, passed to the answering/validation routines.
     local_addr - local address of the connection; supplies dst_addr_4 for IPv4
                  and the local address given to get_incoming_mark().
     netmask    - passed to answer_request().
     auth_dns   - non-zero selects the "auth" label instead of "query" when the
                  request is logged.
   Returns an unsigned char pointer; the return statements are not visible in
   this listing (presumably the packet buffer allocated below - TODO confirm).
   NOTE(review): this listing omits lines of the original file (the embedded line
   numbers skip), so loops, braces, else-branches and preprocessor conditionals
   around several statements are not visible. */
1576 unsigned char *tcp_request(int confd
, time_t now
,
1577 union mysockaddr
*local_addr
, struct in_addr netmask
, int auth_dns
)
1584 int checking_disabled
, ad_question
, do_bit
, added_pheader
= 0;
1585 int check_subnet
, no_cache_dnssec
= 0, cache_secure
= 0;
1587 unsigned short qtype
;
1588 unsigned int gotname
;
1589 unsigned char c1
, c2
;
1590 /* Max TCP packet + slop + size */
1591 unsigned char *packet
= whine_malloc(65536 + MAXDNAME
+ RRFIXEDSZ
+ sizeof(u16
));
/* Layout: 16-bit length word at packet[0..1], DNS message at payload. */
1592 unsigned char *payload
= &packet
[2];
1593 /* largest field in header is 16-bits, so this is still sufficiently aligned */
1594 struct dns_header
*header
= (struct dns_header
*)payload
;
1595 u16
*length
= (u16
*)packet
;
1596 struct server
*last_server
;
1597 struct in_addr dst_addr_4
;
1598 union mysockaddr peer_addr
;
1599 socklen_t peer_len
= sizeof(union mysockaddr
);
/* Find the client's address; it is used below for the locality check, for
   logging and when forwarding. */
1601 if (getpeername(confd
, (struct sockaddr
*)&peer_addr
, &peer_len
) == -1)
1604 /* We can be configured to only accept queries from at-most-one-hop-away addresses. */
1605 if (option_bool(OPT_LOCAL_SERVICE
))
1607 struct addrlist
*addr
;
/* IPv6 peer: compare against the IPv6 entries of daemon->interface_addrs. */
1609 if (peer_addr
.sa
.sa_family
== AF_INET6
)
1611 for (addr
= daemon
->interface_addrs
; addr
; addr
= addr
->next
)
1612 if ((addr
->flags
& ADDRLIST_IPV6
) &&
1613 is_same_net6(&addr
->addr
.addr
.addr6
, &peer_addr
.in6
.sin6_addr
, addr
->prefixlen
))
/* NOTE(review): this local "netmask" has the same name as the function
   parameter, so it shadows it within its scope. */
1619 struct in_addr netmask
;
1620 for (addr
= daemon
->interface_addrs
; addr
; addr
= addr
->next
)
/* NOTE(review): the mask is built with a plain shift and stored without
   htonl(), although s_addr is conventionally in network byte order; also a
   prefixlen of 0 would shift a 32-bit value by 32. Confirm against
   is_same_net()'s expectations. */
1622 netmask
.s_addr
= 0xffffffff << (32 - addr
->prefixlen
);
1623 if (!(addr
->flags
& ADDRLIST_IPV6
) &&
1624 is_same_net(addr
->addr
.addr
.addr4
, peer_addr
.in
.sin_addr
, netmask
))
1630 my_syslog(LOG_WARNING
, _("Ignoring query from non-local network"));
/* Read one query from the client: two length bytes (c1 high, c2 low), then
   "size" bytes of message into payload. A zero size also fails this test.
   The first operand(s) of this condition are not visible in this listing. */
1638 !read_write(confd
, &c1
, 1, 1) || !read_write(confd
, &c2
, 1, 1) ||
1639 !(size
= c1
<< 8 | c2
) ||
1640 !read_write(confd
, payload
, size
, 1))
/* Too short to contain a DNS header. */
1643 if (size
< (int)sizeof(struct dns_header
))
1648 /* save state of "cd" flag in query */
1649 if ((checking_disabled
= header
->hb4
& HB4_CD
))
1650 no_cache_dnssec
= 1;
/* Extract the query name into daemon->namebuff and the type into qtype, then
   log the request against the peer's address. */
1652 if ((gotname
= extract_request(header
, (unsigned int)size
, daemon
->namebuff
, &qtype
)))
1655 struct auth_zone
*zone
;
1657 char *types
= querystr(auth_dns
? "auth" : "query", qtype
);
1659 if (peer_addr
.sa
.sa_family
== AF_INET
)
1660 log_query(F_QUERY
| F_IPV4
| F_FORWARD
, daemon
->namebuff
,
1661 (struct all_addr
*)&peer_addr
.in
.sin_addr
, types
);
1664 log_query(F_QUERY
| F_IPV6
| F_FORWARD
, daemon
->namebuff
,
1665 (struct all_addr
*)&peer_addr
.in6
.sin6_addr
, types
);
1669 /* find queries for zones we're authoritative for, and answer them directly */
1671 for (zone
= daemon
->auth_zones
; zone
; zone
= zone
->next
)
1672 if (in_zone(zone
, daemon
->namebuff
, NULL
))
/* dst_addr_4 is the local IPv4 address of the connection; the assignment of 0
   at 1684 is presumably the non-IPv4 branch (its "else" is not visible). */
1681 if (local_addr
->sa
.sa_family
== AF_INET
)
1682 dst_addr_4
= local_addr
->in
.sin_addr
;
1684 dst_addr_4
.s_addr
= 0;
/* Answer from authoritative data (answer_auth) or from local data/cache
   (answer_request); the conditions choosing between them are not visible.
   Both are given 65536 bytes past the header as the buffer limit. */
1688 m
= answer_auth(header
, ((char *) header
) + 65536, (size_t)size
, now
, &peer_addr
, local_auth
);
1692 /* m > 0 if answered from cache */
1693 m
= answer_request(header
, ((char *) header
) + 65536, (size_t)size
,
1694 dst_addr_4
, netmask
, now
, &ad_question
, &do_bit
);
1696 /* Do this by steam now we're not in the select() loop */
1697 check_log_writer(NULL
);
1701 unsigned int flags
= 0;
1702 struct all_addr
*addrp
= NULL
;
1704 char *domain
= NULL
;
/* Optional rewriting of the query before it is forwarded: add_mac() when
   OPT_ADD_MAC is set, add_source_addr() when OPT_CLIENT_SUBNET is set. */
1706 if (option_bool(OPT_ADD_MAC
))
1707 size
= add_mac(header
, size
, ((char *) header
) + 65536, &peer_addr
);
1709 if (option_bool(OPT_CLIENT_SUBNET
))
1711 size_t new = add_source_addr(header
, size
, ((char *) header
) + 65536, &peer_addr
);
/* Work out which upstream servers apply to this name; a non-zero "flags"
   result skips forwarding (see the test at 1727). */
1720 flags
= search_servers(now
, &addrp
, gotname
, daemon
->namebuff
, &type
, &domain
, &norebind
);
/* Start from the head of the server list when the query is domain-specific,
   strict ordering is requested or there is no remembered server; the assignment
   at 1725 is presumably the alternative branch. */
1722 if (type
!= 0 || option_bool(OPT_ORDER
) || !daemon
->last_server
)
1723 last_server
= daemon
->servers
;
1725 last_server
= daemon
->last_server
;
1727 if (!flags
&& last_server
)
1729 struct server
*firstsendto
= NULL
;
/* Remember a digest of the question section so the reply can be checked
   against it: a hash (1731-1733) or a CRC (1735). Presumably these are
   alternatives selected at compile time; the directives are not visible. */
1731 unsigned char *newhash
, hash
[HASH_SIZE
];
1732 if ((newhash
= hash_questions(header
, (unsigned int)size
, daemon
->keyname
)))
1733 memcpy(hash
, newhash
, HASH_SIZE
);
1735 unsigned int crc
= questions_crc(header
, (unsigned int)size
, daemon
->namebuff
);
1737 /* Loop round available servers until we succeed in connecting to one.
1738 Note that this code subtly ensures that consecutive queries on this connection
1739 which can go to the same server, do so. */
1743 firstsendto
= last_server
;
/* Advance to the next server, wrapping to the head of the list; arriving back
   at firstsendto means every server has been tried. */
1746 if (!(last_server
= last_server
->next
))
1747 last_server
= daemon
->servers
;
1749 if (last_server
== firstsendto
)
1753 /* server for wrong domain */
1754 if (type
!= (last_server
->flags
& SERV_TYPE
) ||
1755 (type
== SERV_HAS_DOMAIN
&& !hostname_isequal(domain
, last_server
->domain
)))
/* No TCP socket to this server yet (tcpfd == -1): create one, bind and
   connect it; on failure close it and mark it unused again. */
1758 if (last_server
->tcpfd
== -1)
1760 if ((last_server
->tcpfd
= socket(last_server
->addr
.sa
.sa_family
, SOCK_STREAM
, 0)) == -1)
1763 if ((!local_bind(last_server
->tcpfd
, &last_server
->source_addr
, last_server
->interface
, 1) ||
1764 connect(last_server
->tcpfd
, &last_server
->addr
.sa
, sa_len(&last_server
->addr
)) == -1))
1766 close(last_server
->tcpfd
);
1767 last_server
->tcpfd
= -1;
1772 if (option_bool(OPT_DNSSEC_VALID
))
1774 size_t new_size
= add_do_bit(header
, size
, ((char *) header
) + 65536);
1776 /* For debugging, set Checking Disabled, otherwise, have the upstream check too,
1777 this allows it to select auth servers when one is returning bad data. */
1778 if (option_bool(OPT_DNSSEC_DEBUG
))
1779 header
->hb4
|= HB4_CD
;
1781 if (size
!= new_size
)
1788 #ifdef HAVE_CONNTRACK
1789 /* Copy connection mark of incoming query to outgoing connection. */
1790 if (option_bool(OPT_CONNTRACK
))
1793 struct all_addr local
;
1795 if (local_addr
->sa
.sa_family
== AF_INET6
)
1796 local
.addr
.addr6
= local_addr
->in6
.sin6_addr
;
1799 local
.addr
.addr4
= local_addr
->in
.sin_addr
;
1801 if (get_incoming_mark(&peer_addr
, &local
, 1, &mark
))
1802 setsockopt(last_server
->tcpfd
, SOL_SOCKET
, SO_MARK
, &mark
, sizeof(unsigned int));
/* Store the query length, in network byte order, in the two bytes ahead of
   the payload. */
1807 *length
= htons(size
);
/* Send the length-prefixed query, then read two length bytes (c1 high, c2 low)
   and that many bytes of reply into payload. On any failure the server's
   socket is closed and marked unused. */
1809 if (!read_write(last_server
->tcpfd
, packet
, size
+ sizeof(u16
), 0) ||
1810 !read_write(last_server
->tcpfd
, &c1
, 1, 1) ||
1811 !read_write(last_server
->tcpfd
, &c2
, 1, 1) ||
1812 !read_write(last_server
->tcpfd
, payload
, (c1
<< 8) | c2
, 1))
1814 close(last_server
->tcpfd
);
1815 last_server
->tcpfd
= -1;
/* Log the forwarding against the server's address. Note that namebuff is
   overwritten with the literal "query" here when the strcpy runs (any guard on
   it is not visible in this listing). */
1822 strcpy(daemon
->namebuff
, "query");
1823 if (last_server
->addr
.sa
.sa_family
== AF_INET
)
1824 log_query(F_SERVER
| F_IPV4
| F_FORWARD
, daemon
->namebuff
,
1825 (struct all_addr
*)&last_server
->addr
.in
.sin_addr
, NULL
);
1828 log_query(F_SERVER
| F_IPV6
| F_FORWARD
, daemon
->namebuff
,
1829 (struct all_addr
*)&last_server
->addr
.in6
.sin6_addr
, NULL
);
/* Validate the reply when DNSSEC validation is on and the client did not set
   the CD bit in its query. */
1833 if (option_bool(OPT_DNSSEC_VALID
) && !checking_disabled
)
1835 int keycount
= DNSSEC_WORK
; /* Limit to number of DNSSEC questions, to catch loops and avoid filling cache. */
1836 int status
= tcp_key_recurse(now
, STAT_TRUNCATED
, header
, m
, 0, daemon
->namebuff
, daemon
->keyname
, last_server
, &keycount
);
/* Turn the outcome into a log string; the condition selecting "ABANDONED" is
   not visible in this listing. */
1840 result
= "ABANDONED";
1842 result
= (status
== STAT_SECURE
? "SECURE" : (status
== STAT_INSECURE
? "INSECURE" : "BOGUS"));
1844 log_query(F_KEYTAG
| F_SECSTAT
, "result", NULL
, result
);
1846 if (status
== STAT_BOGUS
)
1847 no_cache_dnssec
= 1;
1849 if (status
== STAT_SECURE
)
1854 /* restore CD bit to the value in the query */
1855 if (checking_disabled
)
1856 header
->hb4
|= HB4_CD
;
1858 header
->hb4
&= ~HB4_CD
;
1860 /* There's no point in updating the cache, since this process will exit and
1861 lose the information after a few queries. We make this call for the alias and
1862 bogus-nxdomain side-effects. */
1863 /* If the crc of the question section doesn't match the crc we sent, then
1864 someone might be attempting to insert bogus values into the cache by
1865 sending replies containing questions and bogus answers. */
1867 newhash
= hash_questions(header
, (unsigned int)m
, daemon
->namebuff
);
1868 if (!newhash
|| memcmp(hash
, newhash
, HASH_SIZE
) != 0)
1874 if (crc
!= questions_crc(header
, (unsigned int)m
, daemon
->namebuff
))
/* Post-process the upstream reply before it goes back to the client. */
1881 m
= process_reply(header
, now
, last_server
, (unsigned int)m
,
1882 option_bool(OPT_NO_REBIND
) && !norebind
, no_cache_dnssec
,
1883 cache_secure
, ad_question
, do_bit
, added_pheader
, check_subnet
, &peer_addr
);
1889 /* In case of local answer or no connections made. */
1891 m
= setup_reply(header
, (unsigned int)size
, addrp
, flags
, daemon
->local_ttl
);
1895 check_log_writer(NULL
);
/* Write the reply (m message bytes plus the 16-bit length word) back to the
   client; m == 0 or a failed write takes the branch that follows (not visible
   in this listing). */
1899 if (m
== 0 || !read_write(confd
, packet
, m
+ sizeof(u16
), 0))
/* Allocate a new forwarding record with whine_malloc() and push it onto the
   front of daemon->frec_list.
   The visible initialisation links the record to the old list head and clears
   its dependent and blocking_query pointers.
   NOTE(review): this listing omits lines of the original file (embedded lines
   1911-1918 among others), so further field initialisation, any use of "now"
   and the return statement are not visible. */
1904 static struct frec
*allocate_frec(time_t now
)
1908 if ((f
= (struct frec
*)whine_malloc(sizeof(struct frec
))))
/* New record goes in front of the current list head ... */
1910 f
->next
= daemon
->frec_list
;
1919 f
->dependent
= NULL
;
1920 f
->blocking_query
= NULL
;
/* ... and becomes the new head. */
1923 daemon
->frec_list
= f
;
/* Get an entry of daemon->randomsocks[] for the given address family.
   First pass: take an entry whose refcount is 0 and open a socket for it with
   random_sock(family); on success the entry gets refcount 1 and is returned.
   Second pass: share an entry that is in use, has the same family and whose
   refcount is not 0xffff, scanning from index "finger"; its refcount is
   incremented.
   Returns NULL when neither pass finds an entry.
   NOTE(review): this listing omits lines of the original file (the embedded line
   numbers skip), so what happens when random_sock() fails and how "finger" is
   updated are not visible. */
1929 static struct randfd
*allocate_rfd(int family
)
/* Persists across calls; used as the starting offset of the second scan. */
1931 static int finger
= 0;
1934 /* limit the number of sockets we have open to avoid starvation of
1935 (eg) TFTP. Once we have a reasonable number, randomness should be OK */
1937 for (i
= 0; i
< RANDOM_SOCKS
; i
++)
1938 if (daemon
->randomsocks
[i
].refcount
== 0)
1940 if ((daemon
->randomsocks
[i
].fd
= random_sock(family
)) == -1)
1943 daemon
->randomsocks
[i
].refcount
= 1;
1944 daemon
->randomsocks
[i
].family
= family
;
1945 return &daemon
->randomsocks
[i
];
1948 /* No free ones or cannot get new socket, grab an existing one */
1949 for (i
= 0; i
< RANDOM_SOCKS
; i
++)
/* Index wraps around the array, starting at finger. */
1951 int j
= (i
+finger
) % RANDOM_SOCKS
;
/* In use, same family, and refcount not yet at 0xffff. */
1952 if (daemon
->randomsocks
[j
].refcount
!= 0 &&
1953 daemon
->randomsocks
[j
].family
== family
&&
1954 daemon
->randomsocks
[j
].refcount
!= 0xffff)
1957 daemon
->randomsocks
[j
].refcount
++;
1958 return &daemon
->randomsocks
[j
];
1962 return NULL
; /* doom */
/* Release what a forwarding record holds so the record can be reused.
   Drops one reference on each of f->rfd4 and f->rfd6 (when set), frees
   f->stash with blockdata_free(), recursively frees f->blocking_query and
   clears the blocking_query and dependent pointers.
   NOTE(review): this listing omits lines of the original file (the embedded line
   numbers skip), so what is done when a refcount reaches zero, and any other
   fields that are reset, are not visible. */
1964 static void free_frec(struct frec
*f
)
/* The refcount is decremented as part of the test; the zero case is handled in
   the (invisible) body. */
1966 if (f
->rfd4
&& --(f
->rfd4
->refcount
) == 0)
1974 if (f
->rfd6
&& --(f
->rfd6
->refcount
) == 0)
1983 blockdata_free(f
->stash
);
1987 /* Anything we're waiting on is pointless now, too */
1988 if (f
->blocking_query
)
1989 free_frec(f
->blocking_query
);
1990 f
->blocking_query
= NULL
;
1991 f
->dependent
= NULL
;
1995 /* if wait==NULL return a free or older than TIMEOUT record.
1996 else return *wait zero if one available, or *wait is delay to
1997 when the oldest in-use record will expire. Impose an absolute
1998 limit of 4*TIMEOUT before we wipe things (for random sockets).
1999 If force is set, always return a result, even if we have
2000 to allocate above the limit. */
/* The scan walks daemon->frec_list once, counting records and tracking the
   oldest one; new records come from allocate_frec(). The limit on the number
   of records is daemon->ftabsize. May return NULL when allocation fails.
   NOTE(review): this listing omits lines of the original file (the embedded line
   numbers skip), so the bodies of most tests below, including where records
   are freed and returned, are not visible. */
2001 struct frec
*get_new_frec(time_t now
, int *wait
, int force
)
2003 struct frec
*f
, *oldest
, *target
;
2009 for (f
= daemon
->frec_list
, oldest
= NULL
, target
= NULL
, count
= 0; f
; f
= f
->next
, count
++)
/* Record is at least 4*TIMEOUT old. */
2014 if (difftime(now
, f
->time
) >= 4*TIMEOUT
)
/* Track the record with the earliest time; ties go to the later list entry. */
2020 if (!oldest
|| difftime(f
->time
, oldest
->time
) <= 0)
2030 /* can't find empty one, use oldest if there is one
2031 and it's older than timeout */
2032 if (oldest
&& ((int)difftime(now
, oldest
->time
)) >= TIMEOUT
)
2034 /* keep stuff for twice timeout if we can by allocating a new
2036 if (difftime(now
, oldest
->time
) < 2*TIMEOUT
&&
2037 count
<= daemon
->ftabsize
&&
2038 (f
= allocate_frec(now
)))
2049 /* none available, calculate time 'till oldest record expires */
2050 if (!force
&& count
> daemon
->ftabsize
)
/* Time of the last "maximum reached" warning; kept across calls so the
   warning is only considered again after more than 5 seconds. */
2052 static time_t last_log
= 0;
2055 *wait
= oldest
->time
+ (time_t)TIMEOUT
- now
;
2057 if ((int)difftime(now
, last_log
) > 5)
2060 my_syslog(LOG_WARNING
, _("Maximum number of concurrent DNS queries reached (max: %d)"), daemon
->ftabsize
);
2066 if (!(f
= allocate_frec(now
)) && wait
)
2067 /* wait one second on malloc failure */
2070 return f
; /* OK if malloc fails and this is NULL */
2073 /* Find the in-use forwarding record (f->sentto set) whose new_id equals id.
   hash may be NULL, in which case only the id is compared; otherwise the
   record's hash must also match the HASH_SIZE bytes at hash.
   NOTE(review): the return statements are not visible in this listing. */
2074 static struct frec
*lookup_frec(unsigned short id
, void *hash
)
2078 for(f
= daemon
->frec_list
; f
; f
= f
->next
)
2079 if (f
->sentto
&& f
->new_id
== id
&&
2080 (!hash
|| memcmp(hash
, f
->hash
, HASH_SIZE
) == 0))
/* Search daemon->frec_list for a record matching a query as originally
   received. The visible part of the test requires the record's hash to equal
   the HASH_SIZE bytes at "hash" and its source address to equal *addr
   (sockaddr_isequal).
   NOTE(review): this listing omits lines of the original file (embedded lines
   2088-2091 and 2093-2094 among others), so the remaining parameter(s), the
   first operands of the test (presumably involving id) and the return
   statements are not visible. */
2086 static struct frec
*lookup_frec_by_sender(unsigned short id
,
2087 union mysockaddr
*addr
,
2092 for(f
= daemon
->frec_list
; f
; f
= f
->next
)
2095 memcmp(hash
, f
->hash
, HASH_SIZE
) == 0 &&
2096 sockaddr_isequal(&f
->source
, addr
))
2102 /* A server record is going away, remove references to it */
/* Visits every forwarding record that was sent to "server" (what is done with
   each one is not visible in this listing), then clears daemon->last_server
   and daemon->srv_save if either points at it. */
2103 void server_gone(struct server
*server
)
2107 for (f
= daemon
->frec_list
; f
; f
= f
->next
)
2108 if (f
->sentto
&& f
->sentto
== server
)
2111 if (daemon
->last_server
== server
)
2112 daemon
->last_server
= NULL
;
2114 if (daemon
->srv_save
== server
)
2115 daemon
->srv_save
= NULL
;
2118 /* return unique random ids. */
2119 static unsigned short get_id(void)
2121 unsigned short ret
= 0;
2125 while (lookup_frec(ret
, NULL
));