]> git.ipfire.org Git - people/ms/dnsmasq.git/blame - src/forward.c
SERVFAIL is an expected error return, don't try all servers.
[people/ms/dnsmasq.git] / src / forward.c
CommitLineData
c47e3ba4 1/* dnsmasq is Copyright (c) 2000-2014 Simon Kelley
9e4abcb5
SK
2
3 This program is free software; you can redistribute it and/or modify
4 it under the terms of the GNU General Public License as published by
824af85b
SK
5 the Free Software Foundation; version 2 dated June, 1991, or
6 (at your option) version 3 dated 29 June, 2007.
7
9e4abcb5
SK
8 This program is distributed in the hope that it will be useful,
9 but WITHOUT ANY WARRANTY; without even the implied warranty of
10 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 GNU General Public License for more details.
824af85b 12
73a08a24
SK
13 You should have received a copy of the GNU General Public License
14 along with this program. If not, see <http://www.gnu.org/licenses/>.
9e4abcb5
SK
15*/
16
9e4abcb5
SK
17#include "dnsmasq.h"
18
/* Forward declarations of file-local (static) helpers used before their
   definitions. */

/* Forwarding-record lookup, by query id and question hash. */
static struct frec *lookup_frec(unsigned short id, void *hash);
static struct frec *lookup_frec_by_sender(unsigned short id,
                                          union mysockaddr *addr,
                                          void *hash);

static unsigned short get_id(void);
static void free_frec(struct frec *f);
static struct randfd *allocate_rfd(int family);

#ifdef HAVE_DNSSEC
/* Helpers only built when DNSSEC support is compiled in. */
static int tcp_key_recurse(time_t now, int status, struct dns_header *header, size_t n,
                           int class, char *name, char *keyname, struct server *server, int *keycount);
static int do_check_sign(time_t now, struct dns_header *header, size_t plen,
                         char *name, char *keyname, int class);
static int send_check_sign(time_t now, struct dns_header *header, size_t plen,
                           char *name, char *keyname);
#endif
33
34
824af85b 35/* Send a UDP packet with its source address set as "source"
44a2a316 36 unless nowild is true, when we just send it with the kernel default */
29689cfa
SK
37int send_from(int fd, int nowild, char *packet, size_t len,
38 union mysockaddr *to, struct all_addr *source,
50303b19 39 unsigned int iface)
9e4abcb5 40{
44a2a316
SK
41 struct msghdr msg;
42 struct iovec iov[1];
44a2a316
SK
43 union {
44 struct cmsghdr align; /* this ensures alignment */
5e9e0efb 45#if defined(HAVE_LINUX_NETWORK)
44a2a316
SK
46 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
47#elif defined(IP_SENDSRCADDR)
48 char control[CMSG_SPACE(sizeof(struct in_addr))];
49#endif
50#ifdef HAVE_IPV6
51 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
52#endif
53 } control_u;
feba5c1d 54
44a2a316
SK
55 iov[0].iov_base = packet;
56 iov[0].iov_len = len;
57
feba5c1d
SK
58 msg.msg_control = NULL;
59 msg.msg_controllen = 0;
44a2a316
SK
60 msg.msg_flags = 0;
61 msg.msg_name = to;
62 msg.msg_namelen = sa_len(to);
63 msg.msg_iov = iov;
64 msg.msg_iovlen = 1;
feba5c1d 65
26128d27 66 if (!nowild)
44a2a316 67 {
26128d27 68 struct cmsghdr *cmptr;
feba5c1d
SK
69 msg.msg_control = &control_u;
70 msg.msg_controllen = sizeof(control_u);
26128d27
SK
71 cmptr = CMSG_FIRSTHDR(&msg);
72
73 if (to->sa.sa_family == AF_INET)
74 {
5e9e0efb 75#if defined(HAVE_LINUX_NETWORK)
8ef5ada2
SK
76 struct in_pktinfo p;
77 p.ipi_ifindex = 0;
78 p.ipi_spec_dst = source->addr.addr4;
79 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
26128d27 80 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_pktinfo));
c72daea8 81 cmptr->cmsg_level = IPPROTO_IP;
26128d27 82 cmptr->cmsg_type = IP_PKTINFO;
44a2a316 83#elif defined(IP_SENDSRCADDR)
8ef5ada2 84 memcpy(CMSG_DATA(cmptr), &(source->addr.addr4), sizeof(source->addr.addr4));
26128d27
SK
85 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_addr));
86 cmptr->cmsg_level = IPPROTO_IP;
87 cmptr->cmsg_type = IP_SENDSRCADDR;
44a2a316 88#endif
26128d27 89 }
26128d27 90 else
b8187c80 91#ifdef HAVE_IPV6
26128d27 92 {
8ef5ada2
SK
93 struct in6_pktinfo p;
94 p.ipi6_ifindex = iface; /* Need iface for IPv6 to handle link-local addrs */
95 p.ipi6_addr = source->addr.addr6;
96 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
26128d27 97 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
316e2730 98 cmptr->cmsg_type = daemon->v6pktinfo;
c72daea8 99 cmptr->cmsg_level = IPPROTO_IPV6;
26128d27 100 }
3d8df260 101#else
c72daea8 102 (void)iface; /* eliminate warning */
44a2a316 103#endif
26128d27 104 }
feba5c1d 105
29d28dda 106 while (sendmsg(fd, &msg, 0) == -1)
feba5c1d 107 {
fd9fa481 108 if (retry_send())
29d28dda 109 continue;
22d904db 110
29d28dda
SK
111 /* If interface is still in DAD, EINVAL results - ignore that. */
112 if (errno == EINVAL)
113 break;
29689cfa 114
29d28dda 115 my_syslog(LOG_ERR, _("failed to send packet: %s"), strerror(errno));
29689cfa 116 return 0;
feba5c1d 117 }
29d28dda 118
29689cfa 119 return 1;
9e4abcb5 120}
44a2a316 121
28866e95
SK
122static unsigned int search_servers(time_t now, struct all_addr **addrpp,
123 unsigned int qtype, char *qdomain, int *type, char **domain, int *norebind)
feba5c1d
SK
124
125{
126 /* If the query ends in the domain in one of our servers, set
127 domain to point to that name. We find the largest match to allow both
128 domain.org and sub.domain.org to exist. */
129
130 unsigned int namelen = strlen(qdomain);
131 unsigned int matchlen = 0;
132 struct server *serv;
28866e95 133 unsigned int flags = 0;
feba5c1d 134
3be34541 135 for (serv = daemon->servers; serv; serv=serv->next)
feba5c1d 136 /* domain matches take priority over NODOTS matches */
3d8df260 137 if ((serv->flags & SERV_FOR_NODOTS) && *type != SERV_HAS_DOMAIN && !strchr(qdomain, '.') && namelen != 0)
feba5c1d 138 {
28866e95 139 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
feba5c1d 140 *type = SERV_FOR_NODOTS;
feba5c1d 141 if (serv->flags & SERV_NO_ADDR)
36717eee
SK
142 flags = F_NXDOMAIN;
143 else if (serv->flags & SERV_LITERAL_ADDRESS)
144 {
145 if (sflag & qtype)
146 {
147 flags = sflag;
148 if (serv->addr.sa.sa_family == AF_INET)
149 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
feba5c1d 150#ifdef HAVE_IPV6
36717eee
SK
151 else
152 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
feba5c1d 153#endif
36717eee 154 }
824af85b 155 else if (!flags || (flags & F_NXDOMAIN))
36717eee
SK
156 flags = F_NOERR;
157 }
feba5c1d
SK
158 }
159 else if (serv->flags & SERV_HAS_DOMAIN)
160 {
161 unsigned int domainlen = strlen(serv->domain);
b8187c80 162 char *matchstart = qdomain + namelen - domainlen;
feba5c1d 163 if (namelen >= domainlen &&
b8187c80 164 hostname_isequal(matchstart, serv->domain) &&
8ef5ada2 165 (domainlen == 0 || namelen == domainlen || *(matchstart-1) == '.' ))
feba5c1d 166 {
8ef5ada2
SK
167 if (serv->flags & SERV_NO_REBIND)
168 *norebind = 1;
28866e95 169 else
feba5c1d 170 {
28866e95
SK
171 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
172 /* implement priority rules for --address and --server for same domain.
173 --address wins if the address is for the correct AF
174 --server wins otherwise. */
175 if (domainlen != 0 && domainlen == matchlen)
36717eee 176 {
28866e95 177 if ((serv->flags & SERV_LITERAL_ADDRESS))
8ef5ada2 178 {
28866e95
SK
179 if (!(sflag & qtype) && flags == 0)
180 continue;
181 }
182 else
183 {
184 if (flags & (F_IPV4 | F_IPV6))
185 continue;
186 }
187 }
188
189 if (domainlen >= matchlen)
190 {
191 *type = serv->flags & (SERV_HAS_DOMAIN | SERV_USE_RESOLV | SERV_NO_REBIND);
192 *domain = serv->domain;
193 matchlen = domainlen;
194 if (serv->flags & SERV_NO_ADDR)
195 flags = F_NXDOMAIN;
196 else if (serv->flags & SERV_LITERAL_ADDRESS)
197 {
198 if (sflag & qtype)
199 {
200 flags = sflag;
201 if (serv->addr.sa.sa_family == AF_INET)
202 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
feba5c1d 203#ifdef HAVE_IPV6
28866e95
SK
204 else
205 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
feba5c1d 206#endif
28866e95
SK
207 }
208 else if (!flags || (flags & F_NXDOMAIN))
209 flags = F_NOERR;
8ef5ada2 210 }
28866e95
SK
211 else
212 flags = 0;
213 }
214 }
8ef5ada2 215 }
feba5c1d 216 }
8ef5ada2 217
7de060b0 218 if (flags == 0 && !(qtype & F_QUERY) &&
28866e95 219 option_bool(OPT_NODOTS_LOCAL) && !strchr(qdomain, '.') && namelen != 0)
7de060b0
SK
220 /* don't forward A or AAAA queries for simple names, except the empty name */
221 flags = F_NOERR;
8ef5ada2 222
5aabfc78 223 if (flags == F_NXDOMAIN && check_for_local_domain(qdomain, now))
c1bb8504 224 flags = F_NOERR;
feba5c1d 225
824af85b
SK
226 if (flags)
227 {
228 int logflags = 0;
229
230 if (flags == F_NXDOMAIN || flags == F_NOERR)
231 logflags = F_NEG | qtype;
232
1a6bca81 233 log_query(logflags | flags | F_CONFIG | F_FORWARD, qdomain, *addrpp, NULL);
824af85b 234 }
8ef5ada2
SK
235 else if ((*type) & SERV_USE_RESOLV)
236 {
237 *type = 0; /* use normal servers for this domain */
238 *domain = NULL;
239 }
feba5c1d
SK
240 return flags;
241}
44a2a316 242
824af85b
SK
243static int forward_query(int udpfd, union mysockaddr *udpaddr,
244 struct all_addr *dst_addr, unsigned int dst_iface,
83349b8a 245 struct dns_header *header, size_t plen, time_t now,
613ad15d 246 struct frec *forward, int ad_reqd, int do_bit)
9e4abcb5 247{
9e4abcb5 248 char *domain = NULL;
8ef5ada2 249 int type = 0, norebind = 0;
9e4abcb5 250 struct all_addr *addrp = NULL;
28866e95 251 unsigned int flags = 0;
de37951c 252 struct server *start = NULL;
8a9be9e4
SK
253#ifdef HAVE_DNSSEC
254 void *hash = hash_questions(header, plen, daemon->namebuff);
255#else
256 unsigned int crc = questions_crc(header, plen, daemon->namebuff);
257 void *hash = &crc;
258#endif
259 unsigned int gotname = extract_request(header, plen, daemon->namebuff, NULL);
260
00a5b5d4
SK
261 (void)do_bit;
262
3d8df260
SK
263 /* may be no servers available. */
264 if (!daemon->servers)
9e4abcb5 265 forward = NULL;
8a9be9e4 266 else if (forward || (hash && (forward = lookup_frec_by_sender(ntohs(header->id), udpaddr, hash))))
9e4abcb5 267 {
e0c0ad3b 268#ifdef HAVE_DNSSEC
dac74312 269 /* If we've already got an answer to this query, but we're awaiting keys for validation,
e0c0ad3b
SK
270 there's no point retrying the query, retry the key query instead...... */
271 if (forward->blocking_query)
272 {
273 int fd;
274
275 while (forward->blocking_query)
276 forward = forward->blocking_query;
277
278 blockdata_retrieve(forward->stash, forward->stash_len, (void *)header);
279 plen = forward->stash_len;
280
2b29191e 281 if (forward->sentto->addr.sa.sa_family == AF_INET)
e0c0ad3b
SK
282 log_query(F_DNSSEC | F_IPV4, "retry", (struct all_addr *)&forward->sentto->addr.in.sin_addr, "dnssec");
283#ifdef HAVE_IPV6
284 else
285 log_query(F_DNSSEC | F_IPV6, "retry", (struct all_addr *)&forward->sentto->addr.in6.sin6_addr, "dnssec");
286#endif
287
288 if (forward->sentto->sfd)
289 fd = forward->sentto->sfd->fd;
290 else
291 {
292#ifdef HAVE_IPV6
293 if (forward->sentto->addr.sa.sa_family == AF_INET6)
294 fd = forward->rfd6->fd;
295 else
296#endif
297 fd = forward->rfd4->fd;
298 }
299
300 while (sendto(fd, (char *)header, plen, 0,
301 &forward->sentto->addr.sa,
2b29191e 302 sa_len(&forward->sentto->addr)) == -1 && retry_send());
e0c0ad3b
SK
303
304 return 1;
305 }
306#endif
307
de37951c 308 /* retry on existing query, send to all available servers */
9e4abcb5 309 domain = forward->sentto->domain;
824af85b 310 forward->sentto->failed_queries++;
28866e95 311 if (!option_bool(OPT_ORDER))
de37951c 312 {
0a852541 313 forward->forwardall = 1;
3be34541 314 daemon->last_server = NULL;
de37951c 315 }
9e4abcb5 316 type = forward->sentto->flags & SERV_TYPE;
de37951c 317 if (!(start = forward->sentto->next))
3be34541 318 start = daemon->servers; /* at end of list, recycle */
9e4abcb5
SK
319 header->id = htons(forward->new_id);
320 }
321 else
322 {
323 if (gotname)
8ef5ada2 324 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
9e4abcb5 325
3a237152 326 if (!flags && !(forward = get_new_frec(now, NULL, 0)))
feba5c1d
SK
327 /* table full - server failure. */
328 flags = F_NEG;
9e4abcb5
SK
329
330 if (forward)
331 {
0a852541
SK
332 forward->source = *udpaddr;
333 forward->dest = *dst_addr;
334 forward->iface = dst_iface;
0a852541 335 forward->orig_id = ntohs(header->id);
8a9be9e4 336 forward->new_id = get_id();
832af0ba 337 forward->fd = udpfd;
8a9be9e4 338 memcpy(forward->hash, hash, HASH_SIZE);
0a852541 339 forward->forwardall = 0;
ed4c0767 340 forward->flags = 0;
28866e95
SK
341 if (norebind)
342 forward->flags |= FREC_NOREBIND;
572b41eb 343 if (header->hb4 & HB4_CD)
28866e95 344 forward->flags |= FREC_CHECKING_DISABLED;
83349b8a
SK
345 if (ad_reqd)
346 forward->flags |= FREC_AD_QUESTION;
7fa836e1
SK
347#ifdef HAVE_DNSSEC
348 forward->work_counter = DNSSEC_WORK;
613ad15d
SK
349 if (do_bit)
350 forward->flags |= FREC_DO_QUESTION;
7fa836e1 351#endif
613ad15d 352
28866e95
SK
353 header->id = htons(forward->new_id);
354
8ef5ada2
SK
355 /* In strict_order mode, always try servers in the order
356 specified in resolv.conf, if a domain is given
357 always try all the available servers,
9e4abcb5
SK
358 otherwise, use the one last known to work. */
359
8ef5ada2
SK
360 if (type == 0)
361 {
28866e95 362 if (option_bool(OPT_ORDER))
8ef5ada2
SK
363 start = daemon->servers;
364 else if (!(start = daemon->last_server) ||
365 daemon->forwardcount++ > FORWARD_TEST ||
366 difftime(now, daemon->forwardtime) > FORWARD_TIME)
367 {
368 start = daemon->servers;
369 forward->forwardall = 1;
370 daemon->forwardcount = 0;
371 daemon->forwardtime = now;
372 }
373 }
374 else
de37951c 375 {
3be34541 376 start = daemon->servers;
28866e95 377 if (!option_bool(OPT_ORDER))
8ef5ada2 378 forward->forwardall = 1;
de37951c 379 }
9e4abcb5
SK
380 }
381 }
feba5c1d 382
9e4abcb5
SK
383 /* check for send errors here (no route to host)
384 if we fail to send to all nameservers, send back an error
385 packet straight away (helps modem users when offline) */
386
387 if (!flags && forward)
388 {
de37951c
SK
389 struct server *firstsentto = start;
390 int forwarded = 0;
28866e95 391
797a7afb 392 if (option_bool(OPT_ADD_MAC))
60b68069 393 plen = add_mac(header, plen, ((char *) header) + daemon->packet_buff_sz, &forward->source);
28866e95 394
ed4c0767
SK
395 if (option_bool(OPT_CLIENT_SUBNET))
396 {
60b68069 397 size_t new = add_source_addr(header, plen, ((char *) header) + daemon->packet_buff_sz, &forward->source);
ed4c0767
SK
398 if (new != plen)
399 {
400 plen = new;
401 forward->flags |= FREC_HAS_SUBNET;
402 }
403 }
404
3a237152
SK
405#ifdef HAVE_DNSSEC
406 if (option_bool(OPT_DNSSEC_VALID))
0fc2f313 407 {
613ad15d
SK
408 size_t new_plen = add_do_bit(header, plen, ((char *) header) + daemon->packet_buff_sz);
409
5b3bf921
SK
410 /* For debugging, set Checking Disabled, otherwise, have the upstream check too,
411 this allows it to select auth servers when one is returning bad data. */
412 if (option_bool(OPT_DNSSEC_DEBUG))
413 header->hb4 |= HB4_CD;
613ad15d
SK
414
415 if (new_plen != plen)
416 forward->flags |= FREC_ADDED_PHEADER;
417
418 plen = new_plen;
0fc2f313 419 }
3a237152
SK
420#endif
421
9e4abcb5
SK
422 while (1)
423 {
9e4abcb5
SK
424 /* only send to servers dealing with our domain.
425 domain may be NULL, in which case server->domain
426 must be NULL also. */
427
de37951c 428 if (type == (start->flags & SERV_TYPE) &&
fd9fa481
SK
429 (type != SERV_HAS_DOMAIN || hostname_isequal(domain, start->domain)) &&
430 !(start->flags & SERV_LITERAL_ADDRESS))
9e4abcb5 431 {
1a6bca81
SK
432 int fd;
433
434 /* find server socket to use, may need to get random one. */
435 if (start->sfd)
436 fd = start->sfd->fd;
437 else
438 {
439#ifdef HAVE_IPV6
440 if (start->addr.sa.sa_family == AF_INET6)
441 {
442 if (!forward->rfd6 &&
443 !(forward->rfd6 = allocate_rfd(AF_INET6)))
444 break;
3927da46 445 daemon->rfd_save = forward->rfd6;
1a6bca81
SK
446 fd = forward->rfd6->fd;
447 }
448 else
449#endif
450 {
451 if (!forward->rfd4 &&
452 !(forward->rfd4 = allocate_rfd(AF_INET)))
453 break;
3927da46 454 daemon->rfd_save = forward->rfd4;
1a6bca81
SK
455 fd = forward->rfd4->fd;
456 }
7de060b0
SK
457
458#ifdef HAVE_CONNTRACK
459 /* Copy connection mark of incoming query to outgoing connection. */
460 if (option_bool(OPT_CONNTRACK))
461 {
462 unsigned int mark;
797a7afb 463 if (get_incoming_mark(&forward->source, &forward->dest, 0, &mark))
7de060b0
SK
464 setsockopt(fd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
465 }
466#endif
1a6bca81
SK
467 }
468
469 if (sendto(fd, (char *)header, plen, 0,
feba5c1d 470 &start->addr.sa,
fd9fa481
SK
471 sa_len(&start->addr)) == -1)
472 {
473 if (retry_send())
474 continue;
475 }
476 else
9e4abcb5 477 {
cdeda28f
SK
478 /* Keep info in case we want to re-send this packet */
479 daemon->srv_save = start;
480 daemon->packet_len = plen;
481
de37951c 482 if (!gotname)
3be34541 483 strcpy(daemon->namebuff, "query");
de37951c 484 if (start->addr.sa.sa_family == AF_INET)
3be34541 485 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1a6bca81 486 (struct all_addr *)&start->addr.in.sin_addr, NULL);
de37951c
SK
487#ifdef HAVE_IPV6
488 else
3be34541 489 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1a6bca81 490 (struct all_addr *)&start->addr.in6.sin6_addr, NULL);
de37951c 491#endif
824af85b 492 start->queries++;
de37951c
SK
493 forwarded = 1;
494 forward->sentto = start;
0a852541 495 if (!forward->forwardall)
de37951c 496 break;
0a852541 497 forward->forwardall++;
9e4abcb5
SK
498 }
499 }
500
de37951c 501 if (!(start = start->next))
3be34541 502 start = daemon->servers;
9e4abcb5 503
de37951c 504 if (start == firstsentto)
9e4abcb5
SK
505 break;
506 }
507
de37951c 508 if (forwarded)
824af85b 509 return 1;
de37951c 510
9e4abcb5
SK
511 /* could not send on, prepare to return */
512 header->id = htons(forward->orig_id);
1a6bca81 513 free_frec(forward); /* cancel */
9e4abcb5
SK
514 }
515
516 /* could not send on, return empty answer or address if known for whole domain */
b8187c80
SK
517 if (udpfd != -1)
518 {
cdeda28f 519 plen = setup_reply(header, plen, addrp, flags, daemon->local_ttl);
54dd393f 520 send_from(udpfd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND), (char *)header, plen, udpaddr, dst_addr, dst_iface);
b8187c80
SK
521 }
522
824af85b 523 return 0;
9e4abcb5
SK
524}
525
ed4c0767 526static size_t process_reply(struct dns_header *header, time_t now, struct server *server, size_t n, int check_rebind,
613ad15d 527 int no_cache, int cache_secure, int ad_reqd, int do_bit, int added_pheader, int check_subnet, union mysockaddr *query_source)
feba5c1d 528{
36717eee 529 unsigned char *pheader, *sizep;
13d86c73 530 char **sets = 0;
832af0ba 531 int munged = 0, is_sign;
cdeda28f
SK
532 size_t plen;
533
83349b8a 534 (void)ad_reqd;
00a5b5d4 535 (void) do_bit;
83349b8a 536
13d86c73
JD
537#ifdef HAVE_IPSET
538 /* Similar algorithm to search_servers. */
539 struct ipsets *ipset_pos;
540 unsigned int namelen = strlen(daemon->namebuff);
541 unsigned int matchlen = 0;
542 for (ipset_pos = daemon->ipsets; ipset_pos; ipset_pos = ipset_pos->next)
543 {
544 unsigned int domainlen = strlen(ipset_pos->domain);
545 char *matchstart = daemon->namebuff + namelen - domainlen;
546 if (namelen >= domainlen && hostname_isequal(matchstart, ipset_pos->domain) &&
547 (domainlen == 0 || namelen == domainlen || *(matchstart - 1) == '.' ) &&
6c0cb858
SK
548 domainlen >= matchlen)
549 {
550 matchlen = domainlen;
551 sets = ipset_pos->sets;
552 }
13d86c73
JD
553 }
554#endif
555
feba5c1d 556 /* If upstream is advertising a larger UDP packet size
9009d746
SK
557 than we allow, trim it so that we don't get overlarge
558 requests for the client. We can't do this for signed packets. */
feba5c1d 559
ed4c0767 560 if ((pheader = find_pseudoheader(header, n, &plen, &sizep, &is_sign)))
feba5c1d 561 {
83349b8a
SK
562 unsigned short udpsz;
563 unsigned char *psave = sizep;
564
565 GETSHORT(udpsz, sizep);
566
567 if (!is_sign && udpsz > daemon->edns_pktsz)
568 PUTSHORT(daemon->edns_pktsz, psave);
feba5c1d 569
ed4c0767
SK
570 if (check_subnet && !check_source(header, plen, pheader, query_source))
571 {
572 my_syslog(LOG_WARNING, _("discarding DNS reply: subnet option mismatch"));
573 return 0;
574 }
613ad15d
SK
575
576 if (added_pheader)
577 {
578 pheader = 0;
579 header->arcount = htons(0);
580 }
feba5c1d 581 }
83349b8a 582
28866e95 583 /* RFC 4035 sect 4.6 para 3 */
237724c0 584 if (!is_sign && !option_bool(OPT_DNSSEC_PROXY))
795501bc 585 header->hb4 &= ~HB4_AD;
3a237152 586
572b41eb 587 if (OPCODE(header) != QUERY || (RCODE(header) != NOERROR && RCODE(header) != NXDOMAIN))
0a852541
SK
588 return n;
589
feba5c1d 590 /* Complain loudly if the upstream server is non-recursive. */
572b41eb 591 if (!(header->hb4 & HB4_RA) && RCODE(header) == NOERROR && ntohs(header->ancount) == 0 &&
0a852541 592 server && !(server->flags & SERV_WARNED_RECURSIVE))
feba5c1d 593 {
3d8df260 594 prettyprint_addr(&server->addr, daemon->namebuff);
f2621c7f 595 my_syslog(LOG_WARNING, _("nameserver %s refused to do a recursive query"), daemon->namebuff);
28866e95 596 if (!option_bool(OPT_LOG))
0a852541
SK
597 server->flags |= SERV_WARNED_RECURSIVE;
598 }
e292e93d 599
572b41eb 600 if (daemon->bogus_addr && RCODE(header) != NXDOMAIN &&
fd9fa481 601 check_for_bogus_wildcard(header, n, daemon->namebuff, daemon->bogus_addr, now))
feba5c1d 602 {
fd9fa481 603 munged = 1;
572b41eb
SK
604 SET_RCODE(header, NXDOMAIN);
605 header->hb3 &= ~HB3_AA;
6938f347 606 cache_secure = 0;
36717eee 607 }
fd9fa481 608 else
36717eee 609 {
6938f347
SK
610 int doctored = 0;
611
572b41eb 612 if (RCODE(header) == NXDOMAIN &&
fd9fa481 613 extract_request(header, n, daemon->namebuff, NULL) &&
5aabfc78 614 check_for_local_domain(daemon->namebuff, now))
36717eee
SK
615 {
616 /* if we forwarded a query for a locally known name (because it was for
617 an unknown type) and the answer is NXDOMAIN, convert that to NODATA,
618 since we know that the domain exists, even if upstream doesn't */
fd9fa481 619 munged = 1;
572b41eb
SK
620 header->hb3 |= HB3_AA;
621 SET_RCODE(header, NOERROR);
6938f347 622 cache_secure = 0;
feba5c1d 623 }
832af0ba 624
6938f347 625 if (extract_addresses(header, n, daemon->namebuff, now, sets, is_sign, check_rebind, no_cache, cache_secure, &doctored))
824af85b 626 {
8ef5ada2 627 my_syslog(LOG_WARNING, _("possible DNS-rebind attack detected: %s"), daemon->namebuff);
824af85b 628 munged = 1;
6938f347 629 cache_secure = 0;
824af85b 630 }
6938f347
SK
631
632 if (doctored)
633 cache_secure = 0;
feba5c1d 634 }
fd9fa481 635
a25720a3
SK
636#ifdef HAVE_DNSSEC
637 if (no_cache && !(header->hb4 & HB4_CD))
638 {
7d23a66f 639 if (!option_bool(OPT_DNSSEC_DEBUG))
a25720a3
SK
640 {
641 /* Bogus reply, turn into SERVFAIL */
642 SET_RCODE(header, SERVFAIL);
643 munged = 1;
644 }
645 }
6938f347
SK
646
647 if (option_bool(OPT_DNSSEC_VALID))
648 header->hb4 &= ~HB4_AD;
649
83349b8a 650 if (!(header->hb4 & HB4_CD) && ad_reqd && cache_secure)
6938f347 651 header->hb4 |= HB4_AD;
613ad15d
SK
652
653 /* If the requestor didn't set the DO bit, don't return DNSSEC info. */
654 if (!do_bit)
655 n = filter_rrsigs(header, n);
a25720a3
SK
656#endif
657
fd9fa481
SK
658 /* do this after extract_addresses. Ensure NODATA reply and remove
659 nameserver info. */
660
661 if (munged)
662 {
663 header->ancount = htons(0);
664 header->nscount = htons(0);
665 header->arcount = htons(0);
666 }
667
36717eee
SK
668 /* the bogus-nxdomain stuff, doctor and NXDOMAIN->NODATA munging can all elide
669 sections of the packet. Find the new length here and put back pseudoheader
670 if it was removed. */
671 return resize_packet(header, n, pheader, plen);
feba5c1d
SK
672}
673
3be34541 674/* sets new last_server */
1a6bca81 675void reply_query(int fd, int family, time_t now)
9e4abcb5
SK
676{
677 /* packet from peer server, extract data for cache, and send to
678 original requester */
572b41eb 679 struct dns_header *header;
de37951c 680 union mysockaddr serveraddr;
832af0ba 681 struct frec *forward;
de37951c 682 socklen_t addrlen = sizeof(serveraddr);
60b68069 683 ssize_t n = recvfrom(fd, daemon->packet, daemon->packet_buff_sz, 0, &serveraddr.sa, &addrlen);
cdeda28f 684 size_t nn;
1a6bca81 685 struct server *server;
8a9be9e4
SK
686 void *hash;
687#ifndef HAVE_DNSSEC
688 unsigned int crc;
689#endif
690
cdeda28f
SK
691 /* packet buffer overwritten */
692 daemon->srv_save = NULL;
832af0ba 693
de37951c 694 /* Determine the address of the server replying so that we can mark that as good */
1a6bca81 695 serveraddr.sa.sa_family = family;
de37951c
SK
696#ifdef HAVE_IPV6
697 if (serveraddr.sa.sa_family == AF_INET6)
5e9e0efb 698 serveraddr.in6.sin6_flowinfo = 0;
de37951c 699#endif
9e4abcb5 700
490f9075
SK
701 header = (struct dns_header *)daemon->packet;
702
703 if (n < (int)sizeof(struct dns_header) || !(header->hb3 & HB3_QR))
704 return;
705
1a6bca81
SK
706 /* spoof check: answer must come from known server, */
707 for (server = daemon->servers; server; server = server->next)
708 if (!(server->flags & (SERV_LITERAL_ADDRESS | SERV_NO_ADDR)) &&
709 sockaddr_isequal(&server->addr, &serveraddr))
710 break;
490f9075
SK
711
712 if (!server)
713 return;
714
8a9be9e4
SK
715#ifdef HAVE_DNSSEC
716 hash = hash_questions(header, n, daemon->namebuff);
717#else
718 hash = &crc;
719 crc = questions_crc(header, n, daemon->namebuff);
720#endif
fd9fa481 721
490f9075 722 if (!(forward = lookup_frec(ntohs(header->id), hash)))
1a6bca81 723 return;
490f9075 724
572b41eb 725 if ((RCODE(header) == SERVFAIL || RCODE(header) == REFUSED) &&
28866e95 726 !option_bool(OPT_ORDER) &&
1a6bca81
SK
727 forward->forwardall == 0)
728 /* for broken servers, attempt to send to another one. */
9e4abcb5 729 {
1a6bca81
SK
730 unsigned char *pheader;
731 size_t plen;
732 int is_sign;
832af0ba 733
1a6bca81
SK
734 /* recreate query from reply */
735 pheader = find_pseudoheader(header, (size_t)n, &plen, NULL, &is_sign);
736 if (!is_sign)
832af0ba 737 {
1a6bca81
SK
738 header->ancount = htons(0);
739 header->nscount = htons(0);
740 header->arcount = htons(0);
741 if ((nn = resize_packet(header, (size_t)n, pheader, plen)))
832af0ba 742 {
572b41eb 743 header->hb3 &= ~(HB3_QR | HB3_TC);
613ad15d 744 forward_query(-1, NULL, NULL, 0, header, nn, now, forward, 0, 0);
1a6bca81 745 return;
832af0ba 746 }
832af0ba 747 }
1a6bca81 748 }
3a237152
SK
749
750 server = forward->sentto;
1a6bca81
SK
751
752 if ((forward->sentto->flags & SERV_TYPE) == 0)
753 {
51967f98 754 if (RCODE(header) == REFUSED)
1a6bca81
SK
755 server = NULL;
756 else
b8187c80 757 {
1a6bca81
SK
758 struct server *last_server;
759
760 /* find good server by address if possible, otherwise assume the last one we sent to */
761 for (last_server = daemon->servers; last_server; last_server = last_server->next)
762 if (!(last_server->flags & (SERV_LITERAL_ADDRESS | SERV_HAS_DOMAIN | SERV_FOR_NODOTS | SERV_NO_ADDR)) &&
763 sockaddr_isequal(&last_server->addr, &serveraddr))
764 {
765 server = last_server;
766 break;
767 }
768 }
28866e95 769 if (!option_bool(OPT_ALL_SERVERS))
1a6bca81
SK
770 daemon->last_server = server;
771 }
3a237152 772
1a6bca81
SK
773 /* If the answer is an error, keep the forward record in place in case
774 we get a good reply from another server. Kill it when we've
775 had replies from all to avoid filling the forwarding table when
776 everything is broken */
51967f98 777 if (forward->forwardall == 0 || --forward->forwardall == 1 || RCODE(header) != SERVFAIL)
1a6bca81 778 {
3a237152
SK
779 int check_rebind = 0, no_cache_dnssec = 0, cache_secure = 0;
780
781 if (option_bool(OPT_NO_REBIND))
782 check_rebind = !(forward->flags & FREC_NOREBIND);
783
784 /* Don't cache replies where DNSSEC validation was turned off, either
785 the upstream server told us so, or the original query specified it. */
786 if ((header->hb4 & HB4_CD) || (forward->flags & FREC_CHECKING_DISABLED))
787 no_cache_dnssec = 1;
788
789#ifdef HAVE_DNSSEC
51967f98 790 if (server && option_bool(OPT_DNSSEC_VALID) && !(forward->flags & FREC_CHECKING_DISABLED))
3a237152 791 {
9d633048 792 int status;
0fc2f313
SK
793
794 /* We've had a reply already, which we're validating. Ignore this duplicate */
e0c0ad3b 795 if (forward->blocking_query)
0fc2f313 796 return;
9d633048 797
871417d4
SK
798 if (header->hb3 & HB3_TC)
799 {
800 /* Truncated answer can't be validated.
5d3b87a4
SK
801 If this is an answer to a DNSSEC-generated query, we still
802 need to get the client to retry over TCP, so return
803 an answer with the TC bit set, even if the actual answer fits.
804 */
805 status = STAT_TRUNCATED;
871417d4
SK
806 }
807 else if (forward->flags & FREC_DNSKEY_QUERY)
8d718cbb 808 status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
c3e0b9b6 809 else if (forward->flags & FREC_DS_QUERY)
00a5b5d4
SK
810 {
811 status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
812 if (status == STAT_NO_DS)
813 status = STAT_INSECURE;
814 }
815 else if (forward->flags & FREC_CHECK_NOSIGN)
816 status = do_check_sign(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
9d633048 817 else
00a5b5d4
SK
818 {
819 status = dnssec_validate_reply(now, header, n, daemon->namebuff, daemon->keyname, &forward->class, NULL);
820 if (status == STAT_NO_SIG)
821 {
822 if (option_bool(OPT_DNSSEC_NO_SIGN))
823 status = send_check_sign(now, header, n, daemon->namebuff, daemon->keyname);
824 else
825 status = STAT_INSECURE;
826 }
827 }
3a237152
SK
828 /* Can't validate, as we're missing key data. Put this
829 answer aside, whilst we get that. */
00a5b5d4 830 if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG || status == STAT_NEED_KEY)
3a237152 831 {
7fa836e1
SK
832 struct frec *new, *orig;
833
834 /* Free any saved query */
835 if (forward->stash)
836 blockdata_free(forward->stash);
837
838 /* Now save reply pending receipt of key data */
839 if (!(forward->stash = blockdata_alloc((char *)header, n)))
840 return;
841 forward->stash_len = n;
0fc2f313 842
7fa836e1
SK
843 anotherkey:
844 /* Find the original query that started it all.... */
845 for (orig = forward; orig->dependent; orig = orig->dependent);
846
847 if (--orig->work_counter == 0 || !(new = get_new_frec(now, NULL, 1)))
848 status = STAT_INSECURE;
849 else
3a237152 850 {
7fa836e1 851 int fd;
0fc2f313
SK
852 struct frec *next = new->next;
853 *new = *forward; /* copy everything, then overwrite */
854 new->next = next;
0fc2f313 855 new->blocking_query = NULL;
f1668d27
SK
856 new->rfd4 = NULL;
857#ifdef HAVE_IPV6
858 new->rfd6 = NULL;
859#endif
00a5b5d4 860 new->flags &= ~(FREC_DNSKEY_QUERY | FREC_DS_QUERY | FREC_CHECK_NOSIGN);
9d633048 861
7fa836e1
SK
862 new->dependent = forward; /* to find query awaiting new one. */
863 forward->blocking_query = new; /* for garbage cleaning */
864 /* validate routines leave name of required record in daemon->keyname */
865 if (status == STAT_NEED_KEY)
866 {
867 new->flags |= FREC_DNSKEY_QUERY;
868 nn = dnssec_generate_query(header, ((char *) header) + daemon->packet_buff_sz,
869 daemon->keyname, forward->class, T_DNSKEY, &server->addr);
870 }
871 else
872 {
00a5b5d4
SK
873 if (status == STAT_NEED_DS_NEG)
874 new->flags |= FREC_CHECK_NOSIGN;
875 else
876 new->flags |= FREC_DS_QUERY;
7fa836e1
SK
877 nn = dnssec_generate_query(header,((char *) header) + daemon->packet_buff_sz,
878 daemon->keyname, forward->class, T_DS, &server->addr);
879 }
880 if ((hash = hash_questions(header, nn, daemon->namebuff)))
881 memcpy(new->hash, hash, HASH_SIZE);
882 new->new_id = get_id();
883 header->id = htons(new->new_id);
884 /* Save query for retransmission */
885 new->stash = blockdata_alloc((char *)header, nn);
886 new->stash_len = nn;
887
888 /* Don't resend this. */
889 daemon->srv_save = NULL;
e0c0ad3b 890
7fa836e1
SK
891 if (server->sfd)
892 fd = server->sfd->fd;
e0c0ad3b 893 else
3a237152 894 {
7fa836e1
SK
895 fd = -1;
896#ifdef HAVE_IPV6
897 if (server->addr.sa.sa_family == AF_INET6)
9d633048 898 {
7fa836e1
SK
899 if (new->rfd6 || (new->rfd6 = allocate_rfd(AF_INET6)))
900 fd = new->rfd6->fd;
9d633048 901 }
3a237152 902 else
3a237152 903#endif
f1668d27 904 {
7fa836e1
SK
905 if (new->rfd4 || (new->rfd4 = allocate_rfd(AF_INET)))
906 fd = new->rfd4->fd;
f1668d27 907 }
3a237152 908 }
7fa836e1
SK
909
910 if (fd != -1)
911 {
912 while (sendto(fd, (char *)header, nn, 0, &server->addr.sa, sa_len(&server->addr)) == -1 && retry_send());
913 server->queries++;
914 }
915
916 return;
3a237152 917 }
3a237152
SK
918 }
919
920 /* Ok, we reached far enough up the chain-of-trust that we can validate something.
921 Now wind back down, pulling back answers which wouldn't previously validate
7fa836e1
SK
922 and validate them with the new data. Note that if an answer needs multiple
923 keys to validate, we may find another key is needed, in which case we set off
924 down another branch of the tree. Once we get to the original answer
925 (FREC_DNSSEC_QUERY not set) and it validates, return it to the original requestor. */
0744ca66 926 while (forward->dependent)
3a237152 927 {
0744ca66
SK
928 struct frec *prev = forward->dependent;
929 free_frec(forward);
930 forward = prev;
931 forward->blocking_query = NULL; /* already gone */
932 blockdata_retrieve(forward->stash, forward->stash_len, (void *)header);
933 n = forward->stash_len;
934
935 if (status == STAT_SECURE)
3a237152 936 {
0744ca66
SK
937 if (forward->flags & FREC_DNSKEY_QUERY)
938 status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
939 else if (forward->flags & FREC_DS_QUERY)
00a5b5d4
SK
940 {
941 status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
942 if (status == STAT_NO_DS)
943 status = STAT_INSECURE;
944 }
945 else if (forward->flags & FREC_CHECK_NOSIGN)
946 status = do_check_sign(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
0744ca66 947 else
00a5b5d4
SK
948 {
949 status = dnssec_validate_reply(now, header, n, daemon->namebuff, daemon->keyname, &forward->class, NULL);
950 if (status == STAT_NO_SIG)
951 {
952 if (option_bool(OPT_DNSSEC_NO_SIGN))
953 status = send_check_sign(now, header, n, daemon->namebuff, daemon->keyname);
954 else
955 status = STAT_INSECURE;
956 }
957 }
958
959 if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG || status == STAT_NEED_KEY)
7fa836e1 960 goto anotherkey;
3a237152
SK
961 }
962 }
5d3b87a4
SK
963
964 if (status == STAT_TRUNCATED)
0744ca66 965 header->hb3 |= HB3_TC;
5d3b87a4 966 else
7fa836e1
SK
967 {
968 char *result;
969
970 if (forward->work_counter == 0)
971 result = "ABANDONED";
972 else
973 result = (status == STAT_SECURE ? "SECURE" : (status == STAT_INSECURE ? "INSECURE" : "BOGUS"));
974
975 log_query(F_KEYTAG | F_SECSTAT, "result", NULL, result);
976 }
5d3b87a4 977
0fc2f313 978 no_cache_dnssec = 0;
5d3b87a4 979
3a237152
SK
980 if (status == STAT_SECURE)
981 cache_secure = 1;
3a237152
SK
982 else if (status == STAT_BOGUS)
983 no_cache_dnssec = 1;
984 }
83349b8a
SK
985#endif
986
987 /* restore CD bit to the value in the query */
988 if (forward->flags & FREC_CHECKING_DISABLED)
989 header->hb4 |= HB4_CD;
990 else
991 header->hb4 &= ~HB4_CD;
8ef5ada2 992
3a237152 993 if ((nn = process_reply(header, now, server, (size_t)n, check_rebind, no_cache_dnssec, cache_secure,
613ad15d
SK
994 forward->flags & FREC_AD_QUESTION, forward->flags & FREC_DO_QUESTION,
995 forward->flags & FREC_ADDED_PHEADER, forward->flags & FREC_HAS_SUBNET, &forward->source)))
1a6bca81
SK
996 {
997 header->id = htons(forward->orig_id);
572b41eb 998 header->hb4 |= HB4_RA; /* recursion if available */
54dd393f 999 send_from(forward->fd, option_bool(OPT_NOWILD) || option_bool (OPT_CLEVERBIND), daemon->packet, nn,
50303b19 1000 &forward->source, &forward->dest, forward->iface);
b8187c80 1001 }
1a6bca81 1002 free_frec(forward); /* cancel */
9e4abcb5 1003 }
9e4abcb5 1004}
44a2a316 1005
1a6bca81 1006
5aabfc78 1007void receive_query(struct listener *listen, time_t now)
44a2a316 1008{
572b41eb 1009 struct dns_header *header = (struct dns_header *)daemon->packet;
44a2a316 1010 union mysockaddr source_addr;
c1bb8504 1011 unsigned short type;
44a2a316 1012 struct all_addr dst_addr;
f6b7dc47 1013 struct in_addr netmask, dst_addr_4;
cdeda28f
SK
1014 size_t m;
1015 ssize_t n;
3b195961
VG
1016 int if_index = 0, auth_dns = 0;
1017#ifdef HAVE_AUTH
1018 int local_auth = 0;
1019#endif
44a2a316
SK
1020 struct iovec iov[1];
1021 struct msghdr msg;
1022 struct cmsghdr *cmptr;
44a2a316
SK
1023 union {
1024 struct cmsghdr align; /* this ensures alignment */
1025#ifdef HAVE_IPV6
1026 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
1027#endif
5e9e0efb 1028#if defined(HAVE_LINUX_NETWORK)
44a2a316 1029 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
824af85b
SK
1030#elif defined(IP_RECVDSTADDR) && defined(HAVE_SOLARIS_NETWORK)
1031 char control[CMSG_SPACE(sizeof(struct in_addr)) +
1032 CMSG_SPACE(sizeof(unsigned int))];
44a2a316
SK
1033#elif defined(IP_RECVDSTADDR)
1034 char control[CMSG_SPACE(sizeof(struct in_addr)) +
1035 CMSG_SPACE(sizeof(struct sockaddr_dl))];
1036#endif
1037 } control_u;
2329bef5
SK
1038#ifdef HAVE_IPV6
1039 /* Can always get recvd interface for IPv6 */
1040 int check_dst = !option_bool(OPT_NOWILD) || listen->family == AF_INET6;
1041#else
1042 int check_dst = !option_bool(OPT_NOWILD);
1043#endif
1044
cdeda28f
SK
1045 /* packet buffer overwritten */
1046 daemon->srv_save = NULL;
1047
4f7b304f
SK
1048 dst_addr_4.s_addr = 0;
1049 netmask.s_addr = 0;
1050
7e5664bd 1051 if (option_bool(OPT_NOWILD) && listen->iface)
3d8df260 1052 {
4f7b304f
SK
1053 auth_dns = listen->iface->dns_auth;
1054
1055 if (listen->family == AF_INET)
1056 {
1057 dst_addr_4 = listen->iface->addr.in.sin_addr;
1058 netmask = listen->iface->netmask;
1059 }
3d8df260 1060 }
4f7b304f 1061
3be34541
SK
1062 iov[0].iov_base = daemon->packet;
1063 iov[0].iov_len = daemon->edns_pktsz;
44a2a316
SK
1064
1065 msg.msg_control = control_u.control;
1066 msg.msg_controllen = sizeof(control_u);
1067 msg.msg_flags = 0;
1068 msg.msg_name = &source_addr;
1069 msg.msg_namelen = sizeof(source_addr);
1070 msg.msg_iov = iov;
1071 msg.msg_iovlen = 1;
1072
de37951c 1073 if ((n = recvmsg(listen->fd, &msg, 0)) == -1)
3be34541 1074 return;
44a2a316 1075
572b41eb 1076 if (n < (int)sizeof(struct dns_header) ||
5e9e0efb 1077 (msg.msg_flags & MSG_TRUNC) ||
572b41eb 1078 (header->hb3 & HB3_QR))
26128d27
SK
1079 return;
1080
44a2a316 1081 source_addr.sa.sa_family = listen->family;
2a7a2b84
SK
1082
1083 if (listen->family == AF_INET)
1084 {
1085 /* Source-port == 0 is an error, we can't send back to that.
1086 http://www.ietf.org/mail-archive/web/dnsop/current/msg11441.html */
1087 if (source_addr.in.sin_port == 0)
1088 return;
1089 }
44a2a316 1090#ifdef HAVE_IPV6
2a7a2b84
SK
1091 else
1092 {
1093 /* Source-port == 0 is an error, we can't send back to that. */
1094 if (source_addr.in6.sin6_port == 0)
1095 return;
1096 source_addr.in6.sin6_flowinfo = 0;
1097 }
44a2a316 1098#endif
2a7a2b84 1099
c8a80487
SK
1100 /* We can be configured to only accept queries from at-most-one-hop-away addresses. */
1101 if (option_bool(OPT_LOCAL_SERVICE))
1102 {
1103 struct addrlist *addr;
1104#ifdef HAVE_IPV6
1105 if (listen->family == AF_INET6)
1106 {
1107 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1108 if ((addr->flags & ADDRLIST_IPV6) &&
1109 is_same_net6(&addr->addr.addr.addr6, &source_addr.in6.sin6_addr, addr->prefixlen))
1110 break;
1111 }
1112 else
1113#endif
1114 {
1115 struct in_addr netmask;
1116 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1117 {
1118 netmask.s_addr = 0xffffffff << (32 - addr->prefixlen);
1119 if (!(addr->flags & ADDRLIST_IPV6) &&
1120 is_same_net(addr->addr.addr.addr4, source_addr.in.sin_addr, netmask))
1121 break;
1122 }
1123 }
1124 if (!addr)
1125 {
0c8584ea
SK
1126 static int warned = 0;
1127 if (!warned)
1128 {
1129 my_syslog(LOG_WARNING, _("Ignoring query from non-local network"));
1130 warned = 1;
1131 }
c8a80487
SK
1132 return;
1133 }
1134 }
1135
2329bef5 1136 if (check_dst)
26128d27
SK
1137 {
1138 struct ifreq ifr;
1139
1140 if (msg.msg_controllen < sizeof(struct cmsghdr))
1141 return;
44a2a316 1142
5e9e0efb 1143#if defined(HAVE_LINUX_NETWORK)
26128d27
SK
1144 if (listen->family == AF_INET)
1145 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
c72daea8 1146 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_PKTINFO)
26128d27 1147 {
8ef5ada2
SK
1148 union {
1149 unsigned char *c;
1150 struct in_pktinfo *p;
1151 } p;
1152 p.c = CMSG_DATA(cmptr);
1153 dst_addr_4 = dst_addr.addr.addr4 = p.p->ipi_spec_dst;
1154 if_index = p.p->ipi_ifindex;
26128d27
SK
1155 }
1156#elif defined(IP_RECVDSTADDR) && defined(IP_RECVIF)
1157 if (listen->family == AF_INET)
44a2a316 1158 {
26128d27 1159 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
8ef5ada2
SK
1160 {
1161 union {
1162 unsigned char *c;
1163 unsigned int *i;
1164 struct in_addr *a;
1165#ifndef HAVE_SOLARIS_NETWORK
1166 struct sockaddr_dl *s;
1167#endif
1168 } p;
1169 p.c = CMSG_DATA(cmptr);
1170 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVDSTADDR)
1171 dst_addr_4 = dst_addr.addr.addr4 = *(p.a);
1172 else if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVIF)
824af85b 1173#ifdef HAVE_SOLARIS_NETWORK
8ef5ada2 1174 if_index = *(p.i);
824af85b 1175#else
8ef5ada2 1176 if_index = p.s->sdl_index;
824af85b 1177#endif
8ef5ada2 1178 }
44a2a316 1179 }
44a2a316 1180#endif
26128d27 1181
44a2a316 1182#ifdef HAVE_IPV6
26128d27
SK
1183 if (listen->family == AF_INET6)
1184 {
1185 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
c72daea8 1186 if (cmptr->cmsg_level == IPPROTO_IPV6 && cmptr->cmsg_type == daemon->v6pktinfo)
26128d27 1187 {
8ef5ada2
SK
1188 union {
1189 unsigned char *c;
1190 struct in6_pktinfo *p;
1191 } p;
1192 p.c = CMSG_DATA(cmptr);
1193
1194 dst_addr.addr.addr6 = p.p->ipi6_addr;
1195 if_index = p.p->ipi6_ifindex;
26128d27
SK
1196 }
1197 }
44a2a316 1198#endif
26128d27
SK
1199
1200 /* enforce available interface configuration */
1201
e25db1f2 1202 if (!indextoname(listen->fd, if_index, ifr.ifr_name))
5e9e0efb 1203 return;
832af0ba 1204
e25db1f2
SK
1205 if (!iface_check(listen->family, &dst_addr, ifr.ifr_name, &auth_dns))
1206 {
1207 if (!option_bool(OPT_CLEVERBIND))
115ac3e4 1208 enumerate_interfaces(0);
3f2873d4
SK
1209 if (!loopback_exception(listen->fd, listen->family, &dst_addr, ifr.ifr_name) &&
1210 !label_exception(if_index, listen->family, &dst_addr))
e25db1f2
SK
1211 return;
1212 }
1213
552af8b9
SK
1214 if (listen->family == AF_INET && option_bool(OPT_LOCALISE))
1215 {
1216 struct irec *iface;
1217
1218 /* get the netmask of the interface whch has the address we were sent to.
1219 This is no neccessarily the interface we arrived on. */
1220
1221 for (iface = daemon->interfaces; iface; iface = iface->next)
1222 if (iface->addr.sa.sa_family == AF_INET &&
1223 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
1224 break;
1225
1226 /* interface may be new */
e25db1f2 1227 if (!iface && !option_bool(OPT_CLEVERBIND))
115ac3e4 1228 enumerate_interfaces(0);
552af8b9
SK
1229
1230 for (iface = daemon->interfaces; iface; iface = iface->next)
1231 if (iface->addr.sa.sa_family == AF_INET &&
1232 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
1233 break;
1234
1235 /* If we failed, abandon localisation */
1236 if (iface)
1237 netmask = iface->netmask;
1238 else
1239 dst_addr_4.s_addr = 0;
1240 }
44a2a316
SK
1241 }
1242
cdeda28f 1243 if (extract_request(header, (size_t)n, daemon->namebuff, &type))
44a2a316 1244 {
b485ed97
SK
1245#ifdef HAVE_AUTH
1246 struct auth_zone *zone;
1247#endif
610e782a
SK
1248 char *types = querystr(auth_dns ? "auth" : "query", type);
1249
44a2a316 1250 if (listen->family == AF_INET)
3be34541 1251 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1a6bca81 1252 (struct all_addr *)&source_addr.in.sin_addr, types);
44a2a316
SK
1253#ifdef HAVE_IPV6
1254 else
3be34541 1255 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1a6bca81 1256 (struct all_addr *)&source_addr.in6.sin6_addr, types);
44a2a316 1257#endif
44a2a316 1258
b485ed97
SK
1259#ifdef HAVE_AUTH
1260 /* find queries for zones we're authoritative for, and answer them directly */
6008bdbb
SK
1261 if (!auth_dns)
1262 for (zone = daemon->auth_zones; zone; zone = zone->next)
1263 if (in_zone(zone, daemon->namebuff, NULL))
1264 {
1265 auth_dns = 1;
1266 local_auth = 1;
1267 break;
1268 }
b485ed97
SK
1269#endif
1270 }
1271
4820dce9 1272#ifdef HAVE_AUTH
4f7b304f 1273 if (auth_dns)
824af85b 1274 {
60b68069 1275 m = answer_auth(header, ((char *) header) + daemon->packet_buff_sz, (size_t)n, now, &source_addr, local_auth);
4f7b304f 1276 if (m >= 1)
b485ed97
SK
1277 {
1278 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
1279 (char *)header, m, &source_addr, &dst_addr, if_index);
1280 daemon->auth_answer++;
1281 }
824af85b 1282 }
44a2a316 1283 else
4820dce9 1284#endif
4f7b304f 1285 {
613ad15d 1286 int ad_reqd, do_bit;
60b68069 1287 m = answer_request(header, ((char *) header) + daemon->packet_buff_sz, (size_t)n,
613ad15d 1288 dst_addr_4, netmask, now, &ad_reqd, &do_bit);
4f7b304f
SK
1289
1290 if (m >= 1)
1291 {
1292 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
1293 (char *)header, m, &source_addr, &dst_addr, if_index);
1294 daemon->local_answer++;
1295 }
1296 else if (forward_query(listen->fd, &source_addr, &dst_addr, if_index,
613ad15d 1297 header, (size_t)n, now, NULL, ad_reqd, do_bit))
4f7b304f
SK
1298 daemon->queries_forwarded++;
1299 else
1300 daemon->local_answer++;
1301 }
44a2a316
SK
1302}
1303
7d7b7b31 1304#ifdef HAVE_DNSSEC
00a5b5d4
SK
1305
1306/* UDP: we've got an unsigned answer, return STAT_INSECURE if we can prove there's no DS
1307 and therefore the answer shouldn't be signed, or STAT_BOGUS if it should be, or
1308 STAT_NEED_DS_NEG and keyname if we need to do the query. */
1309static int send_check_sign(time_t now, struct dns_header *header, size_t plen, char *name, char *keyname)
1310{
1311 struct crec *crecp;
1312 char *name_start = name;
1313 int status = dnssec_chase_cname(now, header, plen, name, keyname);
1314
1315 if (status != STAT_INSECURE)
1316 return status;
1317
1318 while (1)
1319 {
1320 crecp = cache_find_by_name(NULL, name_start, now, F_DS);
1321
1322 if (crecp && (crecp->flags & F_DNSSECOK))
1323 return (crecp->flags & F_NEG) ? STAT_INSECURE : STAT_BOGUS;
1324
1325 if (crecp && (crecp->flags & F_NEG) && (name_start = strchr(name_start, '.')))
1326 {
1327 name_start++; /* chop a label off and try again */
1328 continue;
1329 }
1330
1331 strcpy(keyname, name_start);
1332 return STAT_NEED_DS_NEG;
1333 }
1334}
1335
1336/* Got answer to DS query from send_check_sign, check for proven non-existence, or make the next DS query to try. */
1337static int do_check_sign(time_t now, struct dns_header *header, size_t plen, char *name, char *keyname, int class)
1338
1339{
1340 char *name_start;
1341 unsigned char *p;
1342 int status = dnssec_validate_ds(now, header, plen, name, keyname, class);
1343
1344 if (status != STAT_INSECURE)
1345 {
1346 if (status == STAT_NO_DS)
1347 status = STAT_INSECURE;
1348 return status;
1349 }
1350
1351 p = (unsigned char *)(header+1);
1352
1353 if (extract_name(header, plen, &p, name, 1, 4) &&
1354 (name_start = strchr(name, '.')))
1355 {
1356 name_start++; /* chop a label off and try again */
1357 strcpy(keyname, name_start);
1358 return STAT_NEED_DS_NEG;
1359 }
1360
1361 return STAT_BOGUS;
1362}
1363
1364/* Move toward the root, until we find a signed non-existance of a DS, in which case
1365 an unsigned answer is OK, or we find a signed DS, in which case there should be
1366 a signature, and the answer is BOGUS */
1367static int tcp_check_for_unsigned_zone(time_t now, struct dns_header *header, size_t plen, int class, char *name,
1368 char *keyname, struct server *server, int *keycount)
1369{
1370 size_t m;
1371 unsigned char *packet, *payload;
1372 u16 *length;
1373 unsigned char *p = (unsigned char *)(header+1);
1374 int status;
1375 char *name_start = name;
1376
1377 /* Get first insecure entry in CNAME chain */
1378 status = tcp_key_recurse(now, STAT_CHASE_CNAME, header, plen, class, name, keyname, server, keycount);
1379 if (status == STAT_BOGUS)
1380 return STAT_BOGUS;
1381
1382 if (!(packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16))))
1383 return STAT_BOGUS;
1384
1385 payload = &packet[2];
1386 header = (struct dns_header *)payload;
1387 length = (u16 *)packet;
1388
1389 while (1)
1390 {
1391 unsigned char *newhash, hash[HASH_SIZE];
1392 unsigned char c1, c2;
1393 struct crec *crecp = cache_find_by_name(NULL, name_start, now, F_DS);
1394
1395 if (--(*keycount) == 0)
fc2833f1
TH
1396 {
1397 free(packet);
1398 return STAT_BOGUS;
1399 }
1400
00a5b5d4
SK
1401 if (crecp && (crecp->flags & F_DNSSECOK))
1402 {
1403 free(packet);
1404 return (crecp->flags & F_NEG) ? STAT_INSECURE : STAT_BOGUS;
1405 }
1406
1407 /* If we have cached insecurely that a DS doesn't exist,
1408 ise that is a hit for where to start looking for the secure one */
1409 if (crecp && (crecp->flags & F_NEG) && (name_start = strchr(name_start, '.')))
1410 {
1411 name_start++; /* chop a label off and try again */
1412 continue;
1413 }
1414
1415 m = dnssec_generate_query(header, ((char *) header) + 65536, name_start, class, T_DS, &server->addr);
1416
1417 /* We rely on the question section coming back unchanged, ensure it is with the hash. */
1418 if ((newhash = hash_questions(header, (unsigned int)m, name)))
00a5b5d4 1419 {
b37f8b99
TH
1420 memcpy(hash, newhash, HASH_SIZE);
1421
1422 *length = htons(m);
00a5b5d4 1423
b37f8b99
TH
1424 if (read_write(server->tcpfd, packet, m + sizeof(u16), 0) &&
1425 read_write(server->tcpfd, &c1, 1, 1) &&
1426 read_write(server->tcpfd, &c2, 1, 1) &&
1427 read_write(server->tcpfd, payload, (c1 << 8) | c2, 1))
00a5b5d4 1428 {
b37f8b99 1429 m = (c1 << 8) | c2;
00a5b5d4 1430
b37f8b99
TH
1431 newhash = hash_questions(header, (unsigned int)m, name);
1432 if (newhash && memcmp(hash, newhash, HASH_SIZE) == 0)
00a5b5d4 1433 {
b37f8b99
TH
1434 /* Note this trashes all three name workspaces */
1435 status = tcp_key_recurse(now, STAT_NEED_DS_NEG, header, m, class, name, keyname, server, keycount);
00a5b5d4 1436
b37f8b99
TH
1437 /* We've found a DS which proves the bit of the DNS where the
1438 original query is, is unsigned, so the answer is OK,
1439 if unvalidated. */
1440 if (status == STAT_NO_DS)
00a5b5d4 1441 {
b37f8b99
TH
1442 free(packet);
1443 return STAT_INSECURE;
1444 }
1445
1446 /* No DS, not got to DNSSEC-land yet, go up. */
1447 if (status == STAT_INSECURE)
1448 {
1449 p = (unsigned char *)(header+1);
1450
1451 if (extract_name(header, plen, &p, name, 1, 4) &&
1452 (name_start = strchr(name, '.')))
1453 {
1454 name_start++; /* chop a label off and try again */
1455 continue;
1456 }
00a5b5d4
SK
1457 }
1458 }
1459 }
1460 }
1461
1462 free(packet);
1463
1464 return STAT_BOGUS;
1465 }
1466}
1467
7fa836e1
SK
1468static int tcp_key_recurse(time_t now, int status, struct dns_header *header, size_t n,
1469 int class, char *name, char *keyname, struct server *server, int *keycount)
7d7b7b31
SK
1470{
1471 /* Recurse up the key heirarchy */
7d7b7b31 1472 int new_status;
7d7b7b31 1473
7fa836e1
SK
1474 /* limit the amount of work we do, to avoid cycling forever on loops in the DNS */
1475 if (--(*keycount) == 0)
1476 return STAT_INSECURE;
7d7b7b31 1477
7fa836e1
SK
1478 if (status == STAT_NEED_KEY)
1479 new_status = dnssec_validate_by_ds(now, header, n, name, keyname, class);
00a5b5d4
SK
1480 else if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG)
1481 {
1482 new_status = dnssec_validate_ds(now, header, n, name, keyname, class);
1483 if (status == STAT_NEED_DS && new_status == STAT_NO_DS)
1484 new_status = STAT_INSECURE;
1485 }
1486 else if (status == STAT_CHASE_CNAME)
1487 new_status = dnssec_chase_cname(now, header, n, name, keyname);
1488 else
1489 {
1490 new_status = dnssec_validate_reply(now, header, n, name, keyname, &class, NULL);
1491
1492 if (new_status == STAT_NO_SIG)
1493 {
1494 if (option_bool(OPT_DNSSEC_NO_SIGN))
1495 new_status = tcp_check_for_unsigned_zone(now, header, n, class, name, keyname, server, keycount);
1496 else
1497 new_status = STAT_INSECURE;
1498 }
1499 }
1500
7fa836e1
SK
1501 /* Can't validate because we need a key/DS whose name now in keyname.
1502 Make query for same, and recurse to validate */
1503 if (new_status == STAT_NEED_DS || new_status == STAT_NEED_KEY)
7d7b7b31 1504 {
7fa836e1
SK
1505 size_t m;
1506 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
1507 unsigned char *payload = &packet[2];
1508 struct dns_header *new_header = (struct dns_header *)payload;
1509 u16 *length = (u16 *)packet;
1510 unsigned char c1, c2;
1511
1512 if (!packet)
1513 return STAT_INSECURE;
1514
1515 another_tcp_key:
1516 m = dnssec_generate_query(new_header, ((char *) new_header) + 65536, keyname, class,
1517 new_status == STAT_NEED_KEY ? T_DNSKEY : T_DS, &server->addr);
7d7b7b31 1518
7fa836e1 1519 *length = htons(m);
7d7b7b31 1520
7fa836e1
SK
1521 if (!read_write(server->tcpfd, packet, m + sizeof(u16), 0) ||
1522 !read_write(server->tcpfd, &c1, 1, 1) ||
1523 !read_write(server->tcpfd, &c2, 1, 1) ||
1524 !read_write(server->tcpfd, payload, (c1 << 8) | c2, 1))
1525 new_status = STAT_INSECURE;
1526 else
7d7b7b31 1527 {
7fa836e1
SK
1528 m = (c1 << 8) | c2;
1529
00a5b5d4
SK
1530 new_status = tcp_key_recurse(now, new_status, new_header, m, class, name, keyname, server, keycount);
1531
1532 if (new_status == STAT_SECURE)
7d7b7b31 1533 {
7fa836e1
SK
1534 /* Reached a validated record, now try again at this level.
1535 Note that we may get ANOTHER NEED_* if an answer needs more than one key.
1536 If so, go round again. */
7d7b7b31 1537
7fa836e1
SK
1538 if (status == STAT_NEED_KEY)
1539 new_status = dnssec_validate_by_ds(now, header, n, name, keyname, class);
00a5b5d4
SK
1540 else if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG)
1541 {
1542 new_status = dnssec_validate_ds(now, header, n, name, keyname, class);
1543 if (status == STAT_NEED_DS && new_status == STAT_NO_DS)
1544 new_status = STAT_INSECURE; /* Validated no DS */
1545 }
1546 else if (status == STAT_CHASE_CNAME)
1547 new_status = dnssec_chase_cname(now, header, n, name, keyname);
1548 else
1549 {
1550 new_status = dnssec_validate_reply(now, header, n, name, keyname, &class, NULL);
1551
1552 if (new_status == STAT_NO_SIG)
1553 {
1554 if (option_bool(OPT_DNSSEC_NO_SIGN))
1555 new_status = tcp_check_for_unsigned_zone(now, header, n, class, name, keyname, server, keycount);
1556 else
1557 new_status = STAT_INSECURE;
1558 }
1559 }
1560
7d7b7b31 1561 if (new_status == STAT_NEED_DS || new_status == STAT_NEED_KEY)
7fa836e1 1562 goto another_tcp_key;
7d7b7b31
SK
1563 }
1564 }
7d7b7b31 1565
7fa836e1
SK
1566 free(packet);
1567 }
7d7b7b31
SK
1568 return new_status;
1569}
1570#endif
1571
1572
feba5c1d
SK
1573/* The daemon forks before calling this: it should deal with one connection,
1574 blocking as necessary, and then return. Note, need to be a bit careful
1575 about resources for debug mode, when the fork is suppressed: that's
1576 done by the caller. */
5aabfc78 1577unsigned char *tcp_request(int confd, time_t now,
4f7b304f 1578 union mysockaddr *local_addr, struct in_addr netmask, int auth_dns)
feba5c1d 1579{
28866e95
SK
1580 size_t size = 0;
1581 int norebind = 0;
3b195961 1582#ifdef HAVE_AUTH
19b16891 1583 int local_auth = 0;
3b195961 1584#endif
613ad15d
SK
1585 int checking_disabled, ad_question, do_bit, added_pheader = 0;
1586 int check_subnet, no_cache_dnssec = 0, cache_secure = 0;
cdeda28f 1587 size_t m;
ee86ce68
SK
1588 unsigned short qtype;
1589 unsigned int gotname;
feba5c1d 1590 unsigned char c1, c2;
4b5ea12e
SK
1591 /* Max TCP packet + slop + size */
1592 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
1593 unsigned char *payload = &packet[2];
1594 /* largest field in header is 16-bits, so this is still sufficiently aligned */
1595 struct dns_header *header = (struct dns_header *)payload;
1596 u16 *length = (u16 *)packet;
3be34541 1597 struct server *last_server;
7de060b0
SK
1598 struct in_addr dst_addr_4;
1599 union mysockaddr peer_addr;
1600 socklen_t peer_len = sizeof(union mysockaddr);
3be34541 1601
7de060b0
SK
1602 if (getpeername(confd, (struct sockaddr *)&peer_addr, &peer_len) == -1)
1603 return packet;
c8a80487
SK
1604
1605 /* We can be configured to only accept queries from at-most-one-hop-away addresses. */
1606 if (option_bool(OPT_LOCAL_SERVICE))
1607 {
1608 struct addrlist *addr;
1609#ifdef HAVE_IPV6
1610 if (peer_addr.sa.sa_family == AF_INET6)
1611 {
1612 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1613 if ((addr->flags & ADDRLIST_IPV6) &&
1614 is_same_net6(&addr->addr.addr.addr6, &peer_addr.in6.sin6_addr, addr->prefixlen))
1615 break;
1616 }
1617 else
1618#endif
1619 {
1620 struct in_addr netmask;
1621 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1622 {
1623 netmask.s_addr = 0xffffffff << (32 - addr->prefixlen);
1624 if (!(addr->flags & ADDRLIST_IPV6) &&
1625 is_same_net(addr->addr.addr.addr4, peer_addr.in.sin_addr, netmask))
1626 break;
1627 }
1628 }
1629 if (!addr)
1630 {
1631 my_syslog(LOG_WARNING, _("Ignoring query from non-local network"));
1632 return packet;
1633 }
1634 }
7de060b0 1635
feba5c1d
SK
1636 while (1)
1637 {
1638 if (!packet ||
1639 !read_write(confd, &c1, 1, 1) || !read_write(confd, &c2, 1, 1) ||
1640 !(size = c1 << 8 | c2) ||
4b5ea12e 1641 !read_write(confd, payload, size, 1))
feba5c1d
SK
1642 return packet;
1643
572b41eb 1644 if (size < (int)sizeof(struct dns_header))
feba5c1d
SK
1645 continue;
1646
ed4c0767
SK
1647 check_subnet = 0;
1648
28866e95 1649 /* save state of "cd" flag in query */
7d7b7b31
SK
1650 if ((checking_disabled = header->hb4 & HB4_CD))
1651 no_cache_dnssec = 1;
28866e95 1652
3be34541 1653 if ((gotname = extract_request(header, (unsigned int)size, daemon->namebuff, &qtype)))
feba5c1d 1654 {
b485ed97
SK
1655#ifdef HAVE_AUTH
1656 struct auth_zone *zone;
1657#endif
610e782a 1658 char *types = querystr(auth_dns ? "auth" : "query", qtype);
7de060b0
SK
1659
1660 if (peer_addr.sa.sa_family == AF_INET)
1661 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1662 (struct all_addr *)&peer_addr.in.sin_addr, types);
feba5c1d 1663#ifdef HAVE_IPV6
7de060b0
SK
1664 else
1665 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1666 (struct all_addr *)&peer_addr.in6.sin6_addr, types);
feba5c1d 1667#endif
b485ed97
SK
1668
1669#ifdef HAVE_AUTH
1670 /* find queries for zones we're authoritative for, and answer them directly */
6008bdbb
SK
1671 if (!auth_dns)
1672 for (zone = daemon->auth_zones; zone; zone = zone->next)
1673 if (in_zone(zone, daemon->namebuff, NULL))
1674 {
1675 auth_dns = 1;
1676 local_auth = 1;
1677 break;
1678 }
b485ed97 1679#endif
feba5c1d
SK
1680 }
1681
7de060b0
SK
1682 if (local_addr->sa.sa_family == AF_INET)
1683 dst_addr_4 = local_addr->in.sin_addr;
1684 else
1685 dst_addr_4.s_addr = 0;
1686
4820dce9 1687#ifdef HAVE_AUTH
4f7b304f 1688 if (auth_dns)
19b16891 1689 m = answer_auth(header, ((char *) header) + 65536, (size_t)size, now, &peer_addr, local_auth);
4f7b304f 1690 else
4820dce9 1691#endif
feba5c1d 1692 {
4f7b304f
SK
1693 /* m > 0 if answered from cache */
1694 m = answer_request(header, ((char *) header) + 65536, (size_t)size,
613ad15d 1695 dst_addr_4, netmask, now, &ad_question, &do_bit);
feba5c1d 1696
4f7b304f
SK
1697 /* Do this by steam now we're not in the select() loop */
1698 check_log_writer(NULL);
1699
1700 if (m == 0)
feba5c1d 1701 {
4f7b304f
SK
1702 unsigned int flags = 0;
1703 struct all_addr *addrp = NULL;
1704 int type = 0;
1705 char *domain = NULL;
feba5c1d 1706
4f7b304f
SK
1707 if (option_bool(OPT_ADD_MAC))
1708 size = add_mac(header, size, ((char *) header) + 65536, &peer_addr);
ed4c0767
SK
1709
1710 if (option_bool(OPT_CLIENT_SUBNET))
1711 {
1712 size_t new = add_source_addr(header, size, ((char *) header) + 65536, &peer_addr);
1713 if (size != new)
1714 {
1715 size = new;
1716 check_subnet = 1;
1717 }
1718 }
1719
4f7b304f
SK
1720 if (gotname)
1721 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
1722
1723 if (type != 0 || option_bool(OPT_ORDER) || !daemon->last_server)
1724 last_server = daemon->servers;
1725 else
1726 last_server = daemon->last_server;
1727
1728 if (!flags && last_server)
1729 {
1730 struct server *firstsendto = NULL;
8a9be9e4 1731#ifdef HAVE_DNSSEC
703c7ff4 1732 unsigned char *newhash, hash[HASH_SIZE];
8a9be9e4
SK
1733 if ((newhash = hash_questions(header, (unsigned int)size, daemon->keyname)))
1734 memcpy(hash, newhash, HASH_SIZE);
b37f8b99
TH
1735 else
1736 memset(hash, 0, HASH_SIZE);
8a9be9e4 1737#else
4f7b304f 1738 unsigned int crc = questions_crc(header, (unsigned int)size, daemon->namebuff);
8a9be9e4 1739#endif
4f7b304f
SK
1740 /* Loop round available servers until we succeed in connecting to one.
1741 Note that this code subtley ensures that consecutive queries on this connection
1742 which can go to the same server, do so. */
1743 while (1)
feba5c1d 1744 {
4f7b304f
SK
1745 if (!firstsendto)
1746 firstsendto = last_server;
1747 else
1748 {
1749 if (!(last_server = last_server->next))
1750 last_server = daemon->servers;
1751
1752 if (last_server == firstsendto)
1753 break;
1754 }
1755
1756 /* server for wrong domain */
1757 if (type != (last_server->flags & SERV_TYPE) ||
1758 (type == SERV_HAS_DOMAIN && !hostname_isequal(domain, last_server->domain)))
7de060b0
SK
1759 continue;
1760
4f7b304f 1761 if (last_server->tcpfd == -1)
7de060b0 1762 {
4f7b304f
SK
1763 if ((last_server->tcpfd = socket(last_server->addr.sa.sa_family, SOCK_STREAM, 0)) == -1)
1764 continue;
1765
1766 if ((!local_bind(last_server->tcpfd, &last_server->source_addr, last_server->interface, 1) ||
1767 connect(last_server->tcpfd, &last_server->addr.sa, sa_len(&last_server->addr)) == -1))
1768 {
1769 close(last_server->tcpfd);
1770 last_server->tcpfd = -1;
1771 continue;
1772 }
1773
7d7b7b31
SK
1774#ifdef HAVE_DNSSEC
1775 if (option_bool(OPT_DNSSEC_VALID))
1776 {
613ad15d
SK
1777 size_t new_size = add_do_bit(header, size, ((char *) header) + 65536);
1778
2ecd9bd5
SK
1779 /* For debugging, set Checking Disabled, otherwise, have the upstream check too,
1780 this allows it to select auth servers when one is returning bad data. */
1781 if (option_bool(OPT_DNSSEC_DEBUG))
1782 header->hb4 |= HB4_CD;
613ad15d
SK
1783
1784 if (size != new_size)
1785 added_pheader = 1;
1786
1787 size = new_size;
7d7b7b31
SK
1788 }
1789#endif
1790
7de060b0 1791#ifdef HAVE_CONNTRACK
4f7b304f
SK
1792 /* Copy connection mark of incoming query to outgoing connection. */
1793 if (option_bool(OPT_CONNTRACK))
1794 {
1795 unsigned int mark;
1796 struct all_addr local;
7de060b0 1797#ifdef HAVE_IPV6
4f7b304f
SK
1798 if (local_addr->sa.sa_family == AF_INET6)
1799 local.addr.addr6 = local_addr->in6.sin6_addr;
1800 else
7de060b0 1801#endif
4f7b304f
SK
1802 local.addr.addr4 = local_addr->in.sin_addr;
1803
1804 if (get_incoming_mark(&peer_addr, &local, 1, &mark))
1805 setsockopt(last_server->tcpfd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
1806 }
7de060b0 1807#endif
4f7b304f
SK
1808 }
1809
4b5ea12e 1810 *length = htons(size);
4f7b304f 1811
4b5ea12e 1812 if (!read_write(last_server->tcpfd, packet, size + sizeof(u16), 0) ||
4f7b304f 1813 !read_write(last_server->tcpfd, &c1, 1, 1) ||
7d7b7b31
SK
1814 !read_write(last_server->tcpfd, &c2, 1, 1) ||
1815 !read_write(last_server->tcpfd, payload, (c1 << 8) | c2, 1))
4f7b304f
SK
1816 {
1817 close(last_server->tcpfd);
1818 last_server->tcpfd = -1;
1819 continue;
1820 }
1821
1822 m = (c1 << 8) | c2;
4f7b304f
SK
1823
1824 if (!gotname)
1825 strcpy(daemon->namebuff, "query");
1826 if (last_server->addr.sa.sa_family == AF_INET)
1827 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1828 (struct all_addr *)&last_server->addr.in.sin_addr, NULL);
feba5c1d 1829#ifdef HAVE_IPV6
4f7b304f
SK
1830 else
1831 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1832 (struct all_addr *)&last_server->addr.in6.sin6_addr, NULL);
feba5c1d 1833#endif
7d7b7b31
SK
1834
1835#ifdef HAVE_DNSSEC
1836 if (option_bool(OPT_DNSSEC_VALID) && !checking_disabled)
1837 {
7fa836e1
SK
1838 int keycount = DNSSEC_WORK; /* Limit to number of DNSSEC questions, to catch loops and avoid filling cache. */
1839 int status = tcp_key_recurse(now, STAT_TRUNCATED, header, m, 0, daemon->namebuff, daemon->keyname, last_server, &keycount);
1840 char *result;
1841
1842 if (keycount == 0)
1843 result = "ABANDONED";
1844 else
1845 result = (status == STAT_SECURE ? "SECURE" : (status == STAT_INSECURE ? "INSECURE" : "BOGUS"));
7d7b7b31 1846
7fa836e1 1847 log_query(F_KEYTAG | F_SECSTAT, "result", NULL, result);
7d7b7b31 1848
7d7b7b31
SK
1849 if (status == STAT_BOGUS)
1850 no_cache_dnssec = 1;
7fa836e1 1851
7d7b7b31
SK
1852 if (status == STAT_SECURE)
1853 cache_secure = 1;
1854 }
1855#endif
1856
1857 /* restore CD bit to the value in the query */
1858 if (checking_disabled)
1859 header->hb4 |= HB4_CD;
1860 else
1861 header->hb4 &= ~HB4_CD;
4f7b304f
SK
1862
1863 /* There's no point in updating the cache, since this process will exit and
1864 lose the information after a few queries. We make this call for the alias and
1865 bogus-nxdomain side-effects. */
1866 /* If the crc of the question section doesn't match the crc we sent, then
1867 someone might be attempting to insert bogus values into the cache by
1868 sending replies containing questions and bogus answers. */
8a9be9e4
SK
1869#ifdef HAVE_DNSSEC
1870 newhash = hash_questions(header, (unsigned int)m, daemon->namebuff);
1871 if (!newhash || memcmp(hash, newhash, HASH_SIZE) != 0)
703c7ff4
SK
1872 {
1873 m = 0;
1874 break;
1875 }
8a9be9e4
SK
1876#else
1877 if (crc != questions_crc(header, (unsigned int)m, daemon->namebuff))
703c7ff4
SK
1878 {
1879 m = 0;
1880 break;
1881 }
8a9be9e4
SK
1882#endif
1883
1884 m = process_reply(header, now, last_server, (unsigned int)m,
1885 option_bool(OPT_NO_REBIND) && !norebind, no_cache_dnssec,
613ad15d 1886 cache_secure, ad_question, do_bit, added_pheader, check_subnet, &peer_addr);
4f7b304f
SK
1887
1888 break;
1889 }
feba5c1d 1890 }
4f7b304f
SK
1891
1892 /* In case of local answer or no connections made. */
1893 if (m == 0)
1894 m = setup_reply(header, (unsigned int)size, addrp, flags, daemon->local_ttl);
feba5c1d 1895 }
feba5c1d 1896 }
4f7b304f 1897
5aabfc78 1898 check_log_writer(NULL);
feba5c1d 1899
4b5ea12e
SK
1900 *length = htons(m);
1901
1902 if (m == 0 || !read_write(confd, packet, m + sizeof(u16), 0))
feba5c1d
SK
1903 return packet;
1904 }
1905}
1906
1697269c 1907static struct frec *allocate_frec(time_t now)
9e4abcb5 1908{
1697269c
SK
1909 struct frec *f;
1910
5aabfc78 1911 if ((f = (struct frec *)whine_malloc(sizeof(struct frec))))
9e4abcb5 1912 {
1a6bca81 1913 f->next = daemon->frec_list;
1697269c 1914 f->time = now;
832af0ba 1915 f->sentto = NULL;
1a6bca81 1916 f->rfd4 = NULL;
28866e95 1917 f->flags = 0;
1a6bca81
SK
1918#ifdef HAVE_IPV6
1919 f->rfd6 = NULL;
3a237152
SK
1920#endif
1921#ifdef HAVE_DNSSEC
97bc798b 1922 f->dependent = NULL;
3a237152 1923 f->blocking_query = NULL;
4619d946 1924 f->stash = NULL;
1a6bca81
SK
1925#endif
1926 daemon->frec_list = f;
1697269c 1927 }
9e4abcb5 1928
1697269c
SK
1929 return f;
1930}
9e4abcb5 1931
1a6bca81
SK
1932static struct randfd *allocate_rfd(int family)
1933{
1934 static int finger = 0;
1935 int i;
1936
1937 /* limit the number of sockets we have open to avoid starvation of
1938 (eg) TFTP. Once we have a reasonable number, randomness should be OK */
1939
1940 for (i = 0; i < RANDOM_SOCKS; i++)
9009d746 1941 if (daemon->randomsocks[i].refcount == 0)
1a6bca81 1942 {
9009d746
SK
1943 if ((daemon->randomsocks[i].fd = random_sock(family)) == -1)
1944 break;
1945
1a6bca81
SK
1946 daemon->randomsocks[i].refcount = 1;
1947 daemon->randomsocks[i].family = family;
1948 return &daemon->randomsocks[i];
1949 }
1950
9009d746 1951 /* No free ones or cannot get new socket, grab an existing one */
1a6bca81
SK
1952 for (i = 0; i < RANDOM_SOCKS; i++)
1953 {
1954 int j = (i+finger) % RANDOM_SOCKS;
9009d746
SK
1955 if (daemon->randomsocks[j].refcount != 0 &&
1956 daemon->randomsocks[j].family == family &&
1957 daemon->randomsocks[j].refcount != 0xffff)
1a6bca81
SK
1958 {
1959 finger = j;
1960 daemon->randomsocks[j].refcount++;
1961 return &daemon->randomsocks[j];
1962 }
1963 }
1964
1965 return NULL; /* doom */
1966}
1a6bca81
SK
1967static void free_frec(struct frec *f)
1968{
1969 if (f->rfd4 && --(f->rfd4->refcount) == 0)
1970 close(f->rfd4->fd);
1971
1972 f->rfd4 = NULL;
1973 f->sentto = NULL;
28866e95 1974 f->flags = 0;
1a6bca81
SK
1975
1976#ifdef HAVE_IPV6
1977 if (f->rfd6 && --(f->rfd6->refcount) == 0)
1978 close(f->rfd6->fd);
1979
1980 f->rfd6 = NULL;
1981#endif
3a237152
SK
1982
1983#ifdef HAVE_DNSSEC
1984 if (f->stash)
0fc2f313
SK
1985 {
1986 blockdata_free(f->stash);
1987 f->stash = NULL;
1988 }
3a237152
SK
1989
1990 /* Anything we're waiting on is pointless now, too */
1991 if (f->blocking_query)
1992 free_frec(f->blocking_query);
1993 f->blocking_query = NULL;
39048ad1 1994 f->dependent = NULL;
3a237152 1995#endif
1a6bca81
SK
1996}
1997
1697269c
SK
1998/* if wait==NULL return a free or older than TIMEOUT record.
1999 else return *wait zero if one available, or *wait is delay to
1a6bca81 2000 when the oldest in-use record will expire. Impose an absolute
3a237152
SK
2001 limit of 4*TIMEOUT before we wipe things (for random sockets).
2002 If force is set, always return a result, even if we have
2003 to allocate above the limit. */
2004struct frec *get_new_frec(time_t now, int *wait, int force)
1697269c 2005{
1a6bca81 2006 struct frec *f, *oldest, *target;
1697269c
SK
2007 int count;
2008
2009 if (wait)
2010 *wait = 0;
2011
1a6bca81 2012 for (f = daemon->frec_list, oldest = NULL, target = NULL, count = 0; f; f = f->next, count++)
832af0ba 2013 if (!f->sentto)
1a6bca81
SK
2014 target = f;
2015 else
1697269c 2016 {
1a6bca81
SK
2017 if (difftime(now, f->time) >= 4*TIMEOUT)
2018 {
2019 free_frec(f);
2020 target = f;
2021 }
2022
2023 if (!oldest || difftime(f->time, oldest->time) <= 0)
2024 oldest = f;
1697269c 2025 }
1a6bca81
SK
2026
2027 if (target)
2028 {
2029 target->time = now;
2030 return target;
2031 }
9e4abcb5
SK
2032
2033 /* can't find empty one, use oldest if there is one
2034 and it's older than timeout */
1697269c 2035 if (oldest && ((int)difftime(now, oldest->time)) >= TIMEOUT)
9e4abcb5 2036 {
1697269c
SK
2037 /* keep stuff for twice timeout if we can by allocating a new
2038 record instead */
2039 if (difftime(now, oldest->time) < 2*TIMEOUT &&
2040 count <= daemon->ftabsize &&
2041 (f = allocate_frec(now)))
2042 return f;
2043
2044 if (!wait)
2045 {
1a6bca81 2046 free_frec(oldest);
1697269c
SK
2047 oldest->time = now;
2048 }
9e4abcb5
SK
2049 return oldest;
2050 }
2051
1697269c 2052 /* none available, calculate time 'till oldest record expires */
3a237152 2053 if (!force && count > daemon->ftabsize)
1697269c 2054 {
0da5e897
MSB
2055 static time_t last_log = 0;
2056
1697269c
SK
2057 if (oldest && wait)
2058 *wait = oldest->time + (time_t)TIMEOUT - now;
0da5e897
MSB
2059
2060 if ((int)difftime(now, last_log) > 5)
2061 {
2062 last_log = now;
2063 my_syslog(LOG_WARNING, _("Maximum number of concurrent DNS queries reached (max: %d)"), daemon->ftabsize);
2064 }
2065
9e4abcb5
SK
2066 return NULL;
2067 }
1697269c
SK
2068
2069 if (!(f = allocate_frec(now)) && wait)
2070 /* wait one second on malloc failure */
2071 *wait = 1;
9e4abcb5 2072
9e4abcb5
SK
2073 return f; /* OK if malloc fails and this is NULL */
2074}
2075
832af0ba 2076/* crc is all-ones if not known. */
8a9be9e4 2077static struct frec *lookup_frec(unsigned short id, void *hash)
9e4abcb5
SK
2078{
2079 struct frec *f;
2080
1a6bca81 2081 for(f = daemon->frec_list; f; f = f->next)
832af0ba 2082 if (f->sentto && f->new_id == id &&
8a9be9e4 2083 (!hash || memcmp(hash, f->hash, HASH_SIZE) == 0))
9e4abcb5
SK
2084 return f;
2085
2086 return NULL;
2087}
2088
2089static struct frec *lookup_frec_by_sender(unsigned short id,
fd9fa481 2090 union mysockaddr *addr,
8a9be9e4 2091 void *hash)
9e4abcb5 2092{
feba5c1d
SK
2093 struct frec *f;
2094
1a6bca81 2095 for(f = daemon->frec_list; f; f = f->next)
832af0ba 2096 if (f->sentto &&
9e4abcb5 2097 f->orig_id == id &&
8a9be9e4 2098 memcmp(hash, f->hash, HASH_SIZE) == 0 &&
9e4abcb5
SK
2099 sockaddr_isequal(&f->source, addr))
2100 return f;
2101
2102 return NULL;
2103}
2104
849a8357 2105/* A server record is going away, remove references to it */
5aabfc78 2106void server_gone(struct server *server)
849a8357
SK
2107{
2108 struct frec *f;
2109
1a6bca81 2110 for (f = daemon->frec_list; f; f = f->next)
832af0ba 2111 if (f->sentto && f->sentto == server)
1a6bca81 2112 free_frec(f);
849a8357
SK
2113
2114 if (daemon->last_server == server)
2115 daemon->last_server = NULL;
2116
2117 if (daemon->srv_save == server)
2118 daemon->srv_save = NULL;
2119}
9e4abcb5 2120
/* Return a random 16-bit id which is not the new_id of any in-use
   forwarding record: keep drawing from rand16() until lookup_frec()
   finds no record with that id. */
static unsigned short get_id(void)
{
  for (;;)
    {
      unsigned short candidate = rand16();

      if (!lookup_frec(candidate, NULL))
        return candidate;
    }
}
2132
2133
2134
2135
2136