]> git.ipfire.org Git - people/ms/dnsmasq.git/blame - src/forward.c
Reorder sanity checks on UDP packet reception, to cope with failed recvfrom()
[people/ms/dnsmasq.git] / src / forward.c
CommitLineData
c47e3ba4 1/* dnsmasq is Copyright (c) 2000-2014 Simon Kelley
9e4abcb5
SK
2
3 This program is free software; you can redistribute it and/or modify
4 it under the terms of the GNU General Public License as published by
824af85b
SK
5 the Free Software Foundation; version 2 dated June, 1991, or
6 (at your option) version 3 dated 29 June, 2007.
7
9e4abcb5
SK
8 This program is distributed in the hope that it will be useful,
9 but WITHOUT ANY WARRANTY; without even the implied warranty of
10 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 GNU General Public License for more details.
824af85b 12
73a08a24
SK
13 You should have received a copy of the GNU General Public License
14 along with this program. If not, see <http://www.gnu.org/licenses/>.
9e4abcb5
SK
15*/
16
9e4abcb5
SK
17#include "dnsmasq.h"
18
/* Prototypes for file-local (static) helpers that are referenced
   before their definitions. */
static struct frec *lookup_frec(unsigned short id, void *hash);
static struct frec *lookup_frec_by_sender(unsigned short id,
                                          union mysockaddr *addr,
                                          void *hash);
static unsigned short get_id(void);
static void free_frec(struct frec *f);
static struct randfd *allocate_rfd(int family);

#ifdef HAVE_DNSSEC
/* Helpers which only exist in DNSSEC-enabled builds. */
static int tcp_key_recurse(time_t now, int status, struct dns_header *header, size_t n,
                           int class, char *name, char *keyname, struct server *server, int *keycount);
static int do_check_sign(time_t now, struct dns_header *header, size_t plen,
                         char *name, char *keyname, int class);
static int send_check_sign(time_t now, struct dns_header *header, size_t plen,
                           char *name, char *keyname);
#endif
33
34
824af85b 35/* Send a UDP packet with its source address set as "source"
44a2a316 36 unless nowild is true, when we just send it with the kernel default */
29689cfa
SK
37int send_from(int fd, int nowild, char *packet, size_t len,
38 union mysockaddr *to, struct all_addr *source,
50303b19 39 unsigned int iface)
9e4abcb5 40{
44a2a316
SK
41 struct msghdr msg;
42 struct iovec iov[1];
44a2a316
SK
43 union {
44 struct cmsghdr align; /* this ensures alignment */
5e9e0efb 45#if defined(HAVE_LINUX_NETWORK)
44a2a316
SK
46 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
47#elif defined(IP_SENDSRCADDR)
48 char control[CMSG_SPACE(sizeof(struct in_addr))];
49#endif
50#ifdef HAVE_IPV6
51 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
52#endif
53 } control_u;
feba5c1d 54
44a2a316
SK
55 iov[0].iov_base = packet;
56 iov[0].iov_len = len;
57
feba5c1d
SK
58 msg.msg_control = NULL;
59 msg.msg_controllen = 0;
44a2a316
SK
60 msg.msg_flags = 0;
61 msg.msg_name = to;
62 msg.msg_namelen = sa_len(to);
63 msg.msg_iov = iov;
64 msg.msg_iovlen = 1;
feba5c1d 65
26128d27 66 if (!nowild)
44a2a316 67 {
26128d27 68 struct cmsghdr *cmptr;
feba5c1d
SK
69 msg.msg_control = &control_u;
70 msg.msg_controllen = sizeof(control_u);
26128d27
SK
71 cmptr = CMSG_FIRSTHDR(&msg);
72
73 if (to->sa.sa_family == AF_INET)
74 {
5e9e0efb 75#if defined(HAVE_LINUX_NETWORK)
8ef5ada2
SK
76 struct in_pktinfo p;
77 p.ipi_ifindex = 0;
78 p.ipi_spec_dst = source->addr.addr4;
79 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
26128d27 80 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_pktinfo));
c72daea8 81 cmptr->cmsg_level = IPPROTO_IP;
26128d27 82 cmptr->cmsg_type = IP_PKTINFO;
44a2a316 83#elif defined(IP_SENDSRCADDR)
8ef5ada2 84 memcpy(CMSG_DATA(cmptr), &(source->addr.addr4), sizeof(source->addr.addr4));
26128d27
SK
85 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_addr));
86 cmptr->cmsg_level = IPPROTO_IP;
87 cmptr->cmsg_type = IP_SENDSRCADDR;
44a2a316 88#endif
26128d27 89 }
26128d27 90 else
b8187c80 91#ifdef HAVE_IPV6
26128d27 92 {
8ef5ada2
SK
93 struct in6_pktinfo p;
94 p.ipi6_ifindex = iface; /* Need iface for IPv6 to handle link-local addrs */
95 p.ipi6_addr = source->addr.addr6;
96 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
26128d27 97 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
316e2730 98 cmptr->cmsg_type = daemon->v6pktinfo;
c72daea8 99 cmptr->cmsg_level = IPPROTO_IPV6;
26128d27 100 }
3d8df260 101#else
c72daea8 102 (void)iface; /* eliminate warning */
44a2a316 103#endif
26128d27 104 }
feba5c1d 105
29d28dda 106 while (sendmsg(fd, &msg, 0) == -1)
feba5c1d 107 {
fd9fa481 108 if (retry_send())
29d28dda 109 continue;
22d904db 110
29d28dda
SK
111 /* If interface is still in DAD, EINVAL results - ignore that. */
112 if (errno == EINVAL)
113 break;
29689cfa 114
29d28dda 115 my_syslog(LOG_ERR, _("failed to send packet: %s"), strerror(errno));
29689cfa 116 return 0;
feba5c1d 117 }
29d28dda 118
29689cfa 119 return 1;
9e4abcb5 120}
44a2a316 121
28866e95
SK
122static unsigned int search_servers(time_t now, struct all_addr **addrpp,
123 unsigned int qtype, char *qdomain, int *type, char **domain, int *norebind)
feba5c1d
SK
124
125{
126 /* If the query ends in the domain in one of our servers, set
127 domain to point to that name. We find the largest match to allow both
128 domain.org and sub.domain.org to exist. */
129
130 unsigned int namelen = strlen(qdomain);
131 unsigned int matchlen = 0;
132 struct server *serv;
28866e95 133 unsigned int flags = 0;
feba5c1d 134
3be34541 135 for (serv = daemon->servers; serv; serv=serv->next)
feba5c1d 136 /* domain matches take priority over NODOTS matches */
3d8df260 137 if ((serv->flags & SERV_FOR_NODOTS) && *type != SERV_HAS_DOMAIN && !strchr(qdomain, '.') && namelen != 0)
feba5c1d 138 {
28866e95 139 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
feba5c1d 140 *type = SERV_FOR_NODOTS;
feba5c1d 141 if (serv->flags & SERV_NO_ADDR)
36717eee
SK
142 flags = F_NXDOMAIN;
143 else if (serv->flags & SERV_LITERAL_ADDRESS)
144 {
145 if (sflag & qtype)
146 {
147 flags = sflag;
148 if (serv->addr.sa.sa_family == AF_INET)
149 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
feba5c1d 150#ifdef HAVE_IPV6
36717eee
SK
151 else
152 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
feba5c1d 153#endif
36717eee 154 }
824af85b 155 else if (!flags || (flags & F_NXDOMAIN))
36717eee
SK
156 flags = F_NOERR;
157 }
feba5c1d
SK
158 }
159 else if (serv->flags & SERV_HAS_DOMAIN)
160 {
161 unsigned int domainlen = strlen(serv->domain);
b8187c80 162 char *matchstart = qdomain + namelen - domainlen;
feba5c1d 163 if (namelen >= domainlen &&
b8187c80 164 hostname_isequal(matchstart, serv->domain) &&
8ef5ada2 165 (domainlen == 0 || namelen == domainlen || *(matchstart-1) == '.' ))
feba5c1d 166 {
8ef5ada2
SK
167 if (serv->flags & SERV_NO_REBIND)
168 *norebind = 1;
28866e95 169 else
feba5c1d 170 {
28866e95
SK
171 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
172 /* implement priority rules for --address and --server for same domain.
173 --address wins if the address is for the correct AF
174 --server wins otherwise. */
175 if (domainlen != 0 && domainlen == matchlen)
36717eee 176 {
28866e95 177 if ((serv->flags & SERV_LITERAL_ADDRESS))
8ef5ada2 178 {
28866e95
SK
179 if (!(sflag & qtype) && flags == 0)
180 continue;
181 }
182 else
183 {
184 if (flags & (F_IPV4 | F_IPV6))
185 continue;
186 }
187 }
188
189 if (domainlen >= matchlen)
190 {
191 *type = serv->flags & (SERV_HAS_DOMAIN | SERV_USE_RESOLV | SERV_NO_REBIND);
192 *domain = serv->domain;
193 matchlen = domainlen;
194 if (serv->flags & SERV_NO_ADDR)
195 flags = F_NXDOMAIN;
196 else if (serv->flags & SERV_LITERAL_ADDRESS)
197 {
198 if (sflag & qtype)
199 {
200 flags = sflag;
201 if (serv->addr.sa.sa_family == AF_INET)
202 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
feba5c1d 203#ifdef HAVE_IPV6
28866e95
SK
204 else
205 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
feba5c1d 206#endif
28866e95
SK
207 }
208 else if (!flags || (flags & F_NXDOMAIN))
209 flags = F_NOERR;
8ef5ada2 210 }
28866e95
SK
211 else
212 flags = 0;
213 }
214 }
8ef5ada2 215 }
feba5c1d 216 }
8ef5ada2 217
7de060b0 218 if (flags == 0 && !(qtype & F_QUERY) &&
28866e95 219 option_bool(OPT_NODOTS_LOCAL) && !strchr(qdomain, '.') && namelen != 0)
7de060b0
SK
220 /* don't forward A or AAAA queries for simple names, except the empty name */
221 flags = F_NOERR;
8ef5ada2 222
5aabfc78 223 if (flags == F_NXDOMAIN && check_for_local_domain(qdomain, now))
c1bb8504 224 flags = F_NOERR;
feba5c1d 225
824af85b
SK
226 if (flags)
227 {
228 int logflags = 0;
229
230 if (flags == F_NXDOMAIN || flags == F_NOERR)
231 logflags = F_NEG | qtype;
232
1a6bca81 233 log_query(logflags | flags | F_CONFIG | F_FORWARD, qdomain, *addrpp, NULL);
824af85b 234 }
8ef5ada2
SK
235 else if ((*type) & SERV_USE_RESOLV)
236 {
237 *type = 0; /* use normal servers for this domain */
238 *domain = NULL;
239 }
feba5c1d
SK
240 return flags;
241}
44a2a316 242
824af85b
SK
243static int forward_query(int udpfd, union mysockaddr *udpaddr,
244 struct all_addr *dst_addr, unsigned int dst_iface,
83349b8a 245 struct dns_header *header, size_t plen, time_t now,
613ad15d 246 struct frec *forward, int ad_reqd, int do_bit)
9e4abcb5 247{
9e4abcb5 248 char *domain = NULL;
8ef5ada2 249 int type = 0, norebind = 0;
9e4abcb5 250 struct all_addr *addrp = NULL;
28866e95 251 unsigned int flags = 0;
de37951c 252 struct server *start = NULL;
8a9be9e4
SK
253#ifdef HAVE_DNSSEC
254 void *hash = hash_questions(header, plen, daemon->namebuff);
255#else
256 unsigned int crc = questions_crc(header, plen, daemon->namebuff);
257 void *hash = &crc;
258#endif
259 unsigned int gotname = extract_request(header, plen, daemon->namebuff, NULL);
260
00a5b5d4
SK
261 (void)do_bit;
262
3d8df260
SK
263 /* may be no servers available. */
264 if (!daemon->servers)
9e4abcb5 265 forward = NULL;
8a9be9e4 266 else if (forward || (hash && (forward = lookup_frec_by_sender(ntohs(header->id), udpaddr, hash))))
9e4abcb5 267 {
e0c0ad3b 268#ifdef HAVE_DNSSEC
dac74312 269 /* If we've already got an answer to this query, but we're awaiting keys for validation,
e0c0ad3b
SK
270 there's no point retrying the query, retry the key query instead...... */
271 if (forward->blocking_query)
272 {
273 int fd;
274
275 while (forward->blocking_query)
276 forward = forward->blocking_query;
277
278 blockdata_retrieve(forward->stash, forward->stash_len, (void *)header);
279 plen = forward->stash_len;
280
2b29191e 281 if (forward->sentto->addr.sa.sa_family == AF_INET)
e0c0ad3b
SK
282 log_query(F_DNSSEC | F_IPV4, "retry", (struct all_addr *)&forward->sentto->addr.in.sin_addr, "dnssec");
283#ifdef HAVE_IPV6
284 else
285 log_query(F_DNSSEC | F_IPV6, "retry", (struct all_addr *)&forward->sentto->addr.in6.sin6_addr, "dnssec");
286#endif
287
288 if (forward->sentto->sfd)
289 fd = forward->sentto->sfd->fd;
290 else
291 {
292#ifdef HAVE_IPV6
293 if (forward->sentto->addr.sa.sa_family == AF_INET6)
294 fd = forward->rfd6->fd;
295 else
296#endif
297 fd = forward->rfd4->fd;
298 }
299
300 while (sendto(fd, (char *)header, plen, 0,
301 &forward->sentto->addr.sa,
2b29191e 302 sa_len(&forward->sentto->addr)) == -1 && retry_send());
e0c0ad3b
SK
303
304 return 1;
305 }
306#endif
307
de37951c 308 /* retry on existing query, send to all available servers */
9e4abcb5 309 domain = forward->sentto->domain;
824af85b 310 forward->sentto->failed_queries++;
28866e95 311 if (!option_bool(OPT_ORDER))
de37951c 312 {
0a852541 313 forward->forwardall = 1;
3be34541 314 daemon->last_server = NULL;
de37951c 315 }
9e4abcb5 316 type = forward->sentto->flags & SERV_TYPE;
de37951c 317 if (!(start = forward->sentto->next))
3be34541 318 start = daemon->servers; /* at end of list, recycle */
9e4abcb5
SK
319 header->id = htons(forward->new_id);
320 }
321 else
322 {
323 if (gotname)
8ef5ada2 324 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
9e4abcb5 325
3a237152 326 if (!flags && !(forward = get_new_frec(now, NULL, 0)))
feba5c1d
SK
327 /* table full - server failure. */
328 flags = F_NEG;
9e4abcb5
SK
329
330 if (forward)
331 {
0a852541
SK
332 forward->source = *udpaddr;
333 forward->dest = *dst_addr;
334 forward->iface = dst_iface;
0a852541 335 forward->orig_id = ntohs(header->id);
8a9be9e4 336 forward->new_id = get_id();
832af0ba 337 forward->fd = udpfd;
8a9be9e4 338 memcpy(forward->hash, hash, HASH_SIZE);
0a852541 339 forward->forwardall = 0;
ed4c0767 340 forward->flags = 0;
28866e95
SK
341 if (norebind)
342 forward->flags |= FREC_NOREBIND;
572b41eb 343 if (header->hb4 & HB4_CD)
28866e95 344 forward->flags |= FREC_CHECKING_DISABLED;
83349b8a
SK
345 if (ad_reqd)
346 forward->flags |= FREC_AD_QUESTION;
7fa836e1
SK
347#ifdef HAVE_DNSSEC
348 forward->work_counter = DNSSEC_WORK;
613ad15d
SK
349 if (do_bit)
350 forward->flags |= FREC_DO_QUESTION;
7fa836e1 351#endif
613ad15d 352
28866e95
SK
353 header->id = htons(forward->new_id);
354
8ef5ada2
SK
355 /* In strict_order mode, always try servers in the order
356 specified in resolv.conf, if a domain is given
357 always try all the available servers,
9e4abcb5
SK
358 otherwise, use the one last known to work. */
359
8ef5ada2
SK
360 if (type == 0)
361 {
28866e95 362 if (option_bool(OPT_ORDER))
8ef5ada2
SK
363 start = daemon->servers;
364 else if (!(start = daemon->last_server) ||
365 daemon->forwardcount++ > FORWARD_TEST ||
366 difftime(now, daemon->forwardtime) > FORWARD_TIME)
367 {
368 start = daemon->servers;
369 forward->forwardall = 1;
370 daemon->forwardcount = 0;
371 daemon->forwardtime = now;
372 }
373 }
374 else
de37951c 375 {
3be34541 376 start = daemon->servers;
28866e95 377 if (!option_bool(OPT_ORDER))
8ef5ada2 378 forward->forwardall = 1;
de37951c 379 }
9e4abcb5
SK
380 }
381 }
feba5c1d 382
9e4abcb5
SK
383 /* check for send errors here (no route to host)
384 if we fail to send to all nameservers, send back an error
385 packet straight away (helps modem users when offline) */
386
387 if (!flags && forward)
388 {
de37951c
SK
389 struct server *firstsentto = start;
390 int forwarded = 0;
28866e95 391
797a7afb 392 if (option_bool(OPT_ADD_MAC))
60b68069 393 plen = add_mac(header, plen, ((char *) header) + daemon->packet_buff_sz, &forward->source);
28866e95 394
ed4c0767
SK
395 if (option_bool(OPT_CLIENT_SUBNET))
396 {
60b68069 397 size_t new = add_source_addr(header, plen, ((char *) header) + daemon->packet_buff_sz, &forward->source);
ed4c0767
SK
398 if (new != plen)
399 {
400 plen = new;
401 forward->flags |= FREC_HAS_SUBNET;
402 }
403 }
404
3a237152
SK
405#ifdef HAVE_DNSSEC
406 if (option_bool(OPT_DNSSEC_VALID))
0fc2f313 407 {
613ad15d
SK
408 size_t new_plen = add_do_bit(header, plen, ((char *) header) + daemon->packet_buff_sz);
409
5b3bf921
SK
410 /* For debugging, set Checking Disabled, otherwise, have the upstream check too,
411 this allows it to select auth servers when one is returning bad data. */
412 if (option_bool(OPT_DNSSEC_DEBUG))
413 header->hb4 |= HB4_CD;
613ad15d
SK
414
415 if (new_plen != plen)
416 forward->flags |= FREC_ADDED_PHEADER;
417
418 plen = new_plen;
0fc2f313 419 }
3a237152
SK
420#endif
421
9e4abcb5
SK
422 while (1)
423 {
9e4abcb5
SK
424 /* only send to servers dealing with our domain.
425 domain may be NULL, in which case server->domain
426 must be NULL also. */
427
de37951c 428 if (type == (start->flags & SERV_TYPE) &&
fd9fa481
SK
429 (type != SERV_HAS_DOMAIN || hostname_isequal(domain, start->domain)) &&
430 !(start->flags & SERV_LITERAL_ADDRESS))
9e4abcb5 431 {
1a6bca81
SK
432 int fd;
433
434 /* find server socket to use, may need to get random one. */
435 if (start->sfd)
436 fd = start->sfd->fd;
437 else
438 {
439#ifdef HAVE_IPV6
440 if (start->addr.sa.sa_family == AF_INET6)
441 {
442 if (!forward->rfd6 &&
443 !(forward->rfd6 = allocate_rfd(AF_INET6)))
444 break;
3927da46 445 daemon->rfd_save = forward->rfd6;
1a6bca81
SK
446 fd = forward->rfd6->fd;
447 }
448 else
449#endif
450 {
451 if (!forward->rfd4 &&
452 !(forward->rfd4 = allocate_rfd(AF_INET)))
453 break;
3927da46 454 daemon->rfd_save = forward->rfd4;
1a6bca81
SK
455 fd = forward->rfd4->fd;
456 }
7de060b0
SK
457
458#ifdef HAVE_CONNTRACK
459 /* Copy connection mark of incoming query to outgoing connection. */
460 if (option_bool(OPT_CONNTRACK))
461 {
462 unsigned int mark;
797a7afb 463 if (get_incoming_mark(&forward->source, &forward->dest, 0, &mark))
7de060b0
SK
464 setsockopt(fd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
465 }
466#endif
1a6bca81
SK
467 }
468
469 if (sendto(fd, (char *)header, plen, 0,
feba5c1d 470 &start->addr.sa,
fd9fa481
SK
471 sa_len(&start->addr)) == -1)
472 {
473 if (retry_send())
474 continue;
475 }
476 else
9e4abcb5 477 {
cdeda28f
SK
478 /* Keep info in case we want to re-send this packet */
479 daemon->srv_save = start;
480 daemon->packet_len = plen;
481
de37951c 482 if (!gotname)
3be34541 483 strcpy(daemon->namebuff, "query");
de37951c 484 if (start->addr.sa.sa_family == AF_INET)
3be34541 485 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1a6bca81 486 (struct all_addr *)&start->addr.in.sin_addr, NULL);
de37951c
SK
487#ifdef HAVE_IPV6
488 else
3be34541 489 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1a6bca81 490 (struct all_addr *)&start->addr.in6.sin6_addr, NULL);
de37951c 491#endif
824af85b 492 start->queries++;
de37951c
SK
493 forwarded = 1;
494 forward->sentto = start;
0a852541 495 if (!forward->forwardall)
de37951c 496 break;
0a852541 497 forward->forwardall++;
9e4abcb5
SK
498 }
499 }
500
de37951c 501 if (!(start = start->next))
3be34541 502 start = daemon->servers;
9e4abcb5 503
de37951c 504 if (start == firstsentto)
9e4abcb5
SK
505 break;
506 }
507
de37951c 508 if (forwarded)
824af85b 509 return 1;
de37951c 510
9e4abcb5
SK
511 /* could not send on, prepare to return */
512 header->id = htons(forward->orig_id);
1a6bca81 513 free_frec(forward); /* cancel */
9e4abcb5
SK
514 }
515
516 /* could not send on, return empty answer or address if known for whole domain */
b8187c80
SK
517 if (udpfd != -1)
518 {
cdeda28f 519 plen = setup_reply(header, plen, addrp, flags, daemon->local_ttl);
54dd393f 520 send_from(udpfd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND), (char *)header, plen, udpaddr, dst_addr, dst_iface);
b8187c80
SK
521 }
522
824af85b 523 return 0;
9e4abcb5
SK
524}
525
ed4c0767 526static size_t process_reply(struct dns_header *header, time_t now, struct server *server, size_t n, int check_rebind,
613ad15d 527 int no_cache, int cache_secure, int ad_reqd, int do_bit, int added_pheader, int check_subnet, union mysockaddr *query_source)
feba5c1d 528{
36717eee 529 unsigned char *pheader, *sizep;
13d86c73 530 char **sets = 0;
832af0ba 531 int munged = 0, is_sign;
cdeda28f
SK
532 size_t plen;
533
83349b8a 534 (void)ad_reqd;
00a5b5d4 535 (void) do_bit;
83349b8a 536
13d86c73
JD
537#ifdef HAVE_IPSET
538 /* Similar algorithm to search_servers. */
539 struct ipsets *ipset_pos;
540 unsigned int namelen = strlen(daemon->namebuff);
541 unsigned int matchlen = 0;
542 for (ipset_pos = daemon->ipsets; ipset_pos; ipset_pos = ipset_pos->next)
543 {
544 unsigned int domainlen = strlen(ipset_pos->domain);
545 char *matchstart = daemon->namebuff + namelen - domainlen;
546 if (namelen >= domainlen && hostname_isequal(matchstart, ipset_pos->domain) &&
547 (domainlen == 0 || namelen == domainlen || *(matchstart - 1) == '.' ) &&
6c0cb858
SK
548 domainlen >= matchlen)
549 {
550 matchlen = domainlen;
551 sets = ipset_pos->sets;
552 }
13d86c73
JD
553 }
554#endif
555
feba5c1d 556 /* If upstream is advertising a larger UDP packet size
9009d746
SK
557 than we allow, trim it so that we don't get overlarge
558 requests for the client. We can't do this for signed packets. */
feba5c1d 559
ed4c0767 560 if ((pheader = find_pseudoheader(header, n, &plen, &sizep, &is_sign)))
feba5c1d 561 {
83349b8a
SK
562 unsigned short udpsz;
563 unsigned char *psave = sizep;
564
565 GETSHORT(udpsz, sizep);
566
567 if (!is_sign && udpsz > daemon->edns_pktsz)
568 PUTSHORT(daemon->edns_pktsz, psave);
feba5c1d 569
ed4c0767
SK
570 if (check_subnet && !check_source(header, plen, pheader, query_source))
571 {
572 my_syslog(LOG_WARNING, _("discarding DNS reply: subnet option mismatch"));
573 return 0;
574 }
613ad15d
SK
575
576 if (added_pheader)
577 {
578 pheader = 0;
579 header->arcount = htons(0);
580 }
feba5c1d 581 }
83349b8a 582
28866e95 583 /* RFC 4035 sect 4.6 para 3 */
237724c0 584 if (!is_sign && !option_bool(OPT_DNSSEC_PROXY))
795501bc 585 header->hb4 &= ~HB4_AD;
3a237152 586
572b41eb 587 if (OPCODE(header) != QUERY || (RCODE(header) != NOERROR && RCODE(header) != NXDOMAIN))
0a852541
SK
588 return n;
589
feba5c1d 590 /* Complain loudly if the upstream server is non-recursive. */
572b41eb 591 if (!(header->hb4 & HB4_RA) && RCODE(header) == NOERROR && ntohs(header->ancount) == 0 &&
0a852541 592 server && !(server->flags & SERV_WARNED_RECURSIVE))
feba5c1d 593 {
3d8df260 594 prettyprint_addr(&server->addr, daemon->namebuff);
f2621c7f 595 my_syslog(LOG_WARNING, _("nameserver %s refused to do a recursive query"), daemon->namebuff);
28866e95 596 if (!option_bool(OPT_LOG))
0a852541
SK
597 server->flags |= SERV_WARNED_RECURSIVE;
598 }
e292e93d 599
572b41eb 600 if (daemon->bogus_addr && RCODE(header) != NXDOMAIN &&
fd9fa481 601 check_for_bogus_wildcard(header, n, daemon->namebuff, daemon->bogus_addr, now))
feba5c1d 602 {
fd9fa481 603 munged = 1;
572b41eb
SK
604 SET_RCODE(header, NXDOMAIN);
605 header->hb3 &= ~HB3_AA;
6938f347 606 cache_secure = 0;
36717eee 607 }
fd9fa481 608 else
36717eee 609 {
6938f347
SK
610 int doctored = 0;
611
572b41eb 612 if (RCODE(header) == NXDOMAIN &&
fd9fa481 613 extract_request(header, n, daemon->namebuff, NULL) &&
5aabfc78 614 check_for_local_domain(daemon->namebuff, now))
36717eee
SK
615 {
616 /* if we forwarded a query for a locally known name (because it was for
617 an unknown type) and the answer is NXDOMAIN, convert that to NODATA,
618 since we know that the domain exists, even if upstream doesn't */
fd9fa481 619 munged = 1;
572b41eb
SK
620 header->hb3 |= HB3_AA;
621 SET_RCODE(header, NOERROR);
6938f347 622 cache_secure = 0;
feba5c1d 623 }
832af0ba 624
6938f347 625 if (extract_addresses(header, n, daemon->namebuff, now, sets, is_sign, check_rebind, no_cache, cache_secure, &doctored))
824af85b 626 {
8ef5ada2 627 my_syslog(LOG_WARNING, _("possible DNS-rebind attack detected: %s"), daemon->namebuff);
824af85b 628 munged = 1;
6938f347 629 cache_secure = 0;
824af85b 630 }
6938f347
SK
631
632 if (doctored)
633 cache_secure = 0;
feba5c1d 634 }
fd9fa481 635
a25720a3
SK
636#ifdef HAVE_DNSSEC
637 if (no_cache && !(header->hb4 & HB4_CD))
638 {
7d23a66f 639 if (!option_bool(OPT_DNSSEC_DEBUG))
a25720a3
SK
640 {
641 /* Bogus reply, turn into SERVFAIL */
642 SET_RCODE(header, SERVFAIL);
643 munged = 1;
644 }
645 }
6938f347
SK
646
647 if (option_bool(OPT_DNSSEC_VALID))
648 header->hb4 &= ~HB4_AD;
649
83349b8a 650 if (!(header->hb4 & HB4_CD) && ad_reqd && cache_secure)
6938f347 651 header->hb4 |= HB4_AD;
613ad15d
SK
652
653 /* If the requestor didn't set the DO bit, don't return DNSSEC info. */
654 if (!do_bit)
655 n = filter_rrsigs(header, n);
a25720a3
SK
656#endif
657
fd9fa481
SK
658 /* do this after extract_addresses. Ensure NODATA reply and remove
659 nameserver info. */
660
661 if (munged)
662 {
663 header->ancount = htons(0);
664 header->nscount = htons(0);
665 header->arcount = htons(0);
666 }
667
36717eee
SK
668 /* the bogus-nxdomain stuff, doctor and NXDOMAIN->NODATA munging can all elide
669 sections of the packet. Find the new length here and put back pseudoheader
670 if it was removed. */
671 return resize_packet(header, n, pheader, plen);
feba5c1d
SK
672}
673
3be34541 674/* sets new last_server */
1a6bca81 675void reply_query(int fd, int family, time_t now)
9e4abcb5
SK
676{
677 /* packet from peer server, extract data for cache, and send to
678 original requester */
572b41eb 679 struct dns_header *header;
de37951c 680 union mysockaddr serveraddr;
832af0ba 681 struct frec *forward;
de37951c 682 socklen_t addrlen = sizeof(serveraddr);
60b68069 683 ssize_t n = recvfrom(fd, daemon->packet, daemon->packet_buff_sz, 0, &serveraddr.sa, &addrlen);
cdeda28f 684 size_t nn;
1a6bca81 685 struct server *server;
8a9be9e4
SK
686 void *hash;
687#ifndef HAVE_DNSSEC
688 unsigned int crc;
689#endif
690
cdeda28f
SK
691 /* packet buffer overwritten */
692 daemon->srv_save = NULL;
832af0ba 693
de37951c 694 /* Determine the address of the server replying so that we can mark that as good */
1a6bca81 695 serveraddr.sa.sa_family = family;
de37951c
SK
696#ifdef HAVE_IPV6
697 if (serveraddr.sa.sa_family == AF_INET6)
5e9e0efb 698 serveraddr.in6.sin6_flowinfo = 0;
de37951c 699#endif
9e4abcb5 700
490f9075
SK
701 header = (struct dns_header *)daemon->packet;
702
703 if (n < (int)sizeof(struct dns_header) || !(header->hb3 & HB3_QR))
704 return;
705
1a6bca81
SK
706 /* spoof check: answer must come from known server, */
707 for (server = daemon->servers; server; server = server->next)
708 if (!(server->flags & (SERV_LITERAL_ADDRESS | SERV_NO_ADDR)) &&
709 sockaddr_isequal(&server->addr, &serveraddr))
710 break;
490f9075
SK
711
712 if (!server)
713 return;
714
8a9be9e4
SK
715#ifdef HAVE_DNSSEC
716 hash = hash_questions(header, n, daemon->namebuff);
717#else
718 hash = &crc;
719 crc = questions_crc(header, n, daemon->namebuff);
720#endif
fd9fa481 721
490f9075 722 if (!(forward = lookup_frec(ntohs(header->id), hash)))
1a6bca81 723 return;
490f9075 724
572b41eb 725 if ((RCODE(header) == SERVFAIL || RCODE(header) == REFUSED) &&
28866e95 726 !option_bool(OPT_ORDER) &&
1a6bca81
SK
727 forward->forwardall == 0)
728 /* for broken servers, attempt to send to another one. */
9e4abcb5 729 {
1a6bca81
SK
730 unsigned char *pheader;
731 size_t plen;
732 int is_sign;
832af0ba 733
1a6bca81
SK
734 /* recreate query from reply */
735 pheader = find_pseudoheader(header, (size_t)n, &plen, NULL, &is_sign);
736 if (!is_sign)
832af0ba 737 {
1a6bca81
SK
738 header->ancount = htons(0);
739 header->nscount = htons(0);
740 header->arcount = htons(0);
741 if ((nn = resize_packet(header, (size_t)n, pheader, plen)))
832af0ba 742 {
572b41eb 743 header->hb3 &= ~(HB3_QR | HB3_TC);
613ad15d 744 forward_query(-1, NULL, NULL, 0, header, nn, now, forward, 0, 0);
1a6bca81 745 return;
832af0ba 746 }
832af0ba 747 }
1a6bca81 748 }
3a237152
SK
749
750 server = forward->sentto;
1a6bca81
SK
751
752 if ((forward->sentto->flags & SERV_TYPE) == 0)
753 {
572b41eb 754 if (RCODE(header) == SERVFAIL || RCODE(header) == REFUSED)
1a6bca81
SK
755 server = NULL;
756 else
b8187c80 757 {
1a6bca81
SK
758 struct server *last_server;
759
760 /* find good server by address if possible, otherwise assume the last one we sent to */
761 for (last_server = daemon->servers; last_server; last_server = last_server->next)
762 if (!(last_server->flags & (SERV_LITERAL_ADDRESS | SERV_HAS_DOMAIN | SERV_FOR_NODOTS | SERV_NO_ADDR)) &&
763 sockaddr_isequal(&last_server->addr, &serveraddr))
764 {
765 server = last_server;
766 break;
767 }
768 }
28866e95 769 if (!option_bool(OPT_ALL_SERVERS))
1a6bca81
SK
770 daemon->last_server = server;
771 }
3a237152 772
1a6bca81
SK
773 /* If the answer is an error, keep the forward record in place in case
774 we get a good reply from another server. Kill it when we've
775 had replies from all to avoid filling the forwarding table when
776 everything is broken */
777 if (forward->forwardall == 0 || --forward->forwardall == 1 ||
572b41eb 778 (RCODE(header) != REFUSED && RCODE(header) != SERVFAIL))
1a6bca81 779 {
3a237152
SK
780 int check_rebind = 0, no_cache_dnssec = 0, cache_secure = 0;
781
782 if (option_bool(OPT_NO_REBIND))
783 check_rebind = !(forward->flags & FREC_NOREBIND);
784
785 /* Don't cache replies where DNSSEC validation was turned off, either
786 the upstream server told us so, or the original query specified it. */
787 if ((header->hb4 & HB4_CD) || (forward->flags & FREC_CHECKING_DISABLED))
788 no_cache_dnssec = 1;
789
790#ifdef HAVE_DNSSEC
791 if (option_bool(OPT_DNSSEC_VALID) && !(forward->flags & FREC_CHECKING_DISABLED))
792 {
9d633048 793 int status;
0fc2f313
SK
794
795 /* We've had a reply already, which we're validating. Ignore this duplicate */
e0c0ad3b 796 if (forward->blocking_query)
0fc2f313 797 return;
9d633048 798
871417d4
SK
799 if (header->hb3 & HB3_TC)
800 {
801 /* Truncated answer can't be validated.
5d3b87a4
SK
802 If this is an answer to a DNSSEC-generated query, we still
803 need to get the client to retry over TCP, so return
804 an answer with the TC bit set, even if the actual answer fits.
805 */
806 status = STAT_TRUNCATED;
871417d4
SK
807 }
808 else if (forward->flags & FREC_DNSKEY_QUERY)
8d718cbb 809 status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
c3e0b9b6 810 else if (forward->flags & FREC_DS_QUERY)
00a5b5d4
SK
811 {
812 status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
813 if (status == STAT_NO_DS)
814 status = STAT_INSECURE;
815 }
816 else if (forward->flags & FREC_CHECK_NOSIGN)
817 status = do_check_sign(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
9d633048 818 else
00a5b5d4
SK
819 {
820 status = dnssec_validate_reply(now, header, n, daemon->namebuff, daemon->keyname, &forward->class, NULL);
821 if (status == STAT_NO_SIG)
822 {
823 if (option_bool(OPT_DNSSEC_NO_SIGN))
824 status = send_check_sign(now, header, n, daemon->namebuff, daemon->keyname);
825 else
826 status = STAT_INSECURE;
827 }
828 }
3a237152
SK
829 /* Can't validate, as we're missing key data. Put this
830 answer aside, whilst we get that. */
00a5b5d4 831 if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG || status == STAT_NEED_KEY)
3a237152 832 {
7fa836e1
SK
833 struct frec *new, *orig;
834
835 /* Free any saved query */
836 if (forward->stash)
837 blockdata_free(forward->stash);
838
839 /* Now save reply pending receipt of key data */
840 if (!(forward->stash = blockdata_alloc((char *)header, n)))
841 return;
842 forward->stash_len = n;
0fc2f313 843
7fa836e1
SK
844 anotherkey:
845 /* Find the original query that started it all.... */
846 for (orig = forward; orig->dependent; orig = orig->dependent);
847
848 if (--orig->work_counter == 0 || !(new = get_new_frec(now, NULL, 1)))
849 status = STAT_INSECURE;
850 else
3a237152 851 {
7fa836e1 852 int fd;
0fc2f313
SK
853 struct frec *next = new->next;
854 *new = *forward; /* copy everything, then overwrite */
855 new->next = next;
0fc2f313 856 new->blocking_query = NULL;
f1668d27
SK
857 new->rfd4 = NULL;
858#ifdef HAVE_IPV6
859 new->rfd6 = NULL;
860#endif
00a5b5d4 861 new->flags &= ~(FREC_DNSKEY_QUERY | FREC_DS_QUERY | FREC_CHECK_NOSIGN);
9d633048 862
7fa836e1
SK
863 new->dependent = forward; /* to find query awaiting new one. */
864 forward->blocking_query = new; /* for garbage cleaning */
865 /* validate routines leave name of required record in daemon->keyname */
866 if (status == STAT_NEED_KEY)
867 {
868 new->flags |= FREC_DNSKEY_QUERY;
869 nn = dnssec_generate_query(header, ((char *) header) + daemon->packet_buff_sz,
870 daemon->keyname, forward->class, T_DNSKEY, &server->addr);
871 }
872 else
873 {
00a5b5d4
SK
874 if (status == STAT_NEED_DS_NEG)
875 new->flags |= FREC_CHECK_NOSIGN;
876 else
877 new->flags |= FREC_DS_QUERY;
7fa836e1
SK
878 nn = dnssec_generate_query(header,((char *) header) + daemon->packet_buff_sz,
879 daemon->keyname, forward->class, T_DS, &server->addr);
880 }
881 if ((hash = hash_questions(header, nn, daemon->namebuff)))
882 memcpy(new->hash, hash, HASH_SIZE);
883 new->new_id = get_id();
884 header->id = htons(new->new_id);
885 /* Save query for retransmission */
886 new->stash = blockdata_alloc((char *)header, nn);
887 new->stash_len = nn;
888
889 /* Don't resend this. */
890 daemon->srv_save = NULL;
e0c0ad3b 891
7fa836e1
SK
892 if (server->sfd)
893 fd = server->sfd->fd;
e0c0ad3b 894 else
3a237152 895 {
7fa836e1
SK
896 fd = -1;
897#ifdef HAVE_IPV6
898 if (server->addr.sa.sa_family == AF_INET6)
9d633048 899 {
7fa836e1
SK
900 if (new->rfd6 || (new->rfd6 = allocate_rfd(AF_INET6)))
901 fd = new->rfd6->fd;
9d633048 902 }
3a237152 903 else
3a237152 904#endif
f1668d27 905 {
7fa836e1
SK
906 if (new->rfd4 || (new->rfd4 = allocate_rfd(AF_INET)))
907 fd = new->rfd4->fd;
f1668d27 908 }
3a237152 909 }
7fa836e1
SK
910
911 if (fd != -1)
912 {
913 while (sendto(fd, (char *)header, nn, 0, &server->addr.sa, sa_len(&server->addr)) == -1 && retry_send());
914 server->queries++;
915 }
916
917 return;
3a237152 918 }
3a237152
SK
919 }
920
921 /* Ok, we reached far enough up the chain-of-trust that we can validate something.
922 Now wind back down, pulling back answers which wouldn't previously validate
7fa836e1
SK
923 and validate them with the new data. Note that if an answer needs multiple
924 keys to validate, we may find another key is needed, in which case we set off
925 down another branch of the tree. Once we get to the original answer
926 (FREC_DNSSEC_QUERY not set) and it validates, return it to the original requestor. */
0744ca66 927 while (forward->dependent)
3a237152 928 {
0744ca66
SK
929 struct frec *prev = forward->dependent;
930 free_frec(forward);
931 forward = prev;
932 forward->blocking_query = NULL; /* already gone */
933 blockdata_retrieve(forward->stash, forward->stash_len, (void *)header);
934 n = forward->stash_len;
935
936 if (status == STAT_SECURE)
3a237152 937 {
0744ca66
SK
938 if (forward->flags & FREC_DNSKEY_QUERY)
939 status = dnssec_validate_by_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
940 else if (forward->flags & FREC_DS_QUERY)
00a5b5d4
SK
941 {
942 status = dnssec_validate_ds(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
943 if (status == STAT_NO_DS)
944 status = STAT_INSECURE;
945 }
946 else if (forward->flags & FREC_CHECK_NOSIGN)
947 status = do_check_sign(now, header, n, daemon->namebuff, daemon->keyname, forward->class);
0744ca66 948 else
00a5b5d4
SK
949 {
950 status = dnssec_validate_reply(now, header, n, daemon->namebuff, daemon->keyname, &forward->class, NULL);
951 if (status == STAT_NO_SIG)
952 {
953 if (option_bool(OPT_DNSSEC_NO_SIGN))
954 status = send_check_sign(now, header, n, daemon->namebuff, daemon->keyname);
955 else
956 status = STAT_INSECURE;
957 }
958 }
959
960 if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG || status == STAT_NEED_KEY)
7fa836e1 961 goto anotherkey;
3a237152
SK
962 }
963 }
5d3b87a4
SK
964
965 if (status == STAT_TRUNCATED)
0744ca66 966 header->hb3 |= HB3_TC;
5d3b87a4 967 else
7fa836e1
SK
968 {
969 char *result;
970
971 if (forward->work_counter == 0)
972 result = "ABANDONED";
973 else
974 result = (status == STAT_SECURE ? "SECURE" : (status == STAT_INSECURE ? "INSECURE" : "BOGUS"));
975
976 log_query(F_KEYTAG | F_SECSTAT, "result", NULL, result);
977 }
5d3b87a4 978
0fc2f313 979 no_cache_dnssec = 0;
5d3b87a4 980
3a237152
SK
981 if (status == STAT_SECURE)
982 cache_secure = 1;
3a237152
SK
983 else if (status == STAT_BOGUS)
984 no_cache_dnssec = 1;
985 }
83349b8a
SK
986#endif
987
988 /* restore CD bit to the value in the query */
989 if (forward->flags & FREC_CHECKING_DISABLED)
990 header->hb4 |= HB4_CD;
991 else
992 header->hb4 &= ~HB4_CD;
8ef5ada2 993
3a237152 994 if ((nn = process_reply(header, now, server, (size_t)n, check_rebind, no_cache_dnssec, cache_secure,
613ad15d
SK
995 forward->flags & FREC_AD_QUESTION, forward->flags & FREC_DO_QUESTION,
996 forward->flags & FREC_ADDED_PHEADER, forward->flags & FREC_HAS_SUBNET, &forward->source)))
1a6bca81
SK
997 {
998 header->id = htons(forward->orig_id);
572b41eb 999 header->hb4 |= HB4_RA; /* recursion if available */
54dd393f 1000 send_from(forward->fd, option_bool(OPT_NOWILD) || option_bool (OPT_CLEVERBIND), daemon->packet, nn,
50303b19 1001 &forward->source, &forward->dest, forward->iface);
b8187c80 1002 }
1a6bca81 1003 free_frec(forward); /* cancel */
9e4abcb5 1004 }
9e4abcb5 1005}
44a2a316 1006
1a6bca81 1007
5aabfc78 1008void receive_query(struct listener *listen, time_t now)
44a2a316 1009{
572b41eb 1010 struct dns_header *header = (struct dns_header *)daemon->packet;
44a2a316 1011 union mysockaddr source_addr;
c1bb8504 1012 unsigned short type;
44a2a316 1013 struct all_addr dst_addr;
f6b7dc47 1014 struct in_addr netmask, dst_addr_4;
cdeda28f
SK
1015 size_t m;
1016 ssize_t n;
3b195961
VG
1017 int if_index = 0, auth_dns = 0;
1018#ifdef HAVE_AUTH
1019 int local_auth = 0;
1020#endif
44a2a316
SK
1021 struct iovec iov[1];
1022 struct msghdr msg;
1023 struct cmsghdr *cmptr;
44a2a316
SK
1024 union {
1025 struct cmsghdr align; /* this ensures alignment */
1026#ifdef HAVE_IPV6
1027 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
1028#endif
5e9e0efb 1029#if defined(HAVE_LINUX_NETWORK)
44a2a316 1030 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
824af85b
SK
1031#elif defined(IP_RECVDSTADDR) && defined(HAVE_SOLARIS_NETWORK)
1032 char control[CMSG_SPACE(sizeof(struct in_addr)) +
1033 CMSG_SPACE(sizeof(unsigned int))];
44a2a316
SK
1034#elif defined(IP_RECVDSTADDR)
1035 char control[CMSG_SPACE(sizeof(struct in_addr)) +
1036 CMSG_SPACE(sizeof(struct sockaddr_dl))];
1037#endif
1038 } control_u;
2329bef5
SK
1039#ifdef HAVE_IPV6
1040 /* Can always get recvd interface for IPv6 */
1041 int check_dst = !option_bool(OPT_NOWILD) || listen->family == AF_INET6;
1042#else
1043 int check_dst = !option_bool(OPT_NOWILD);
1044#endif
1045
cdeda28f
SK
1046 /* packet buffer overwritten */
1047 daemon->srv_save = NULL;
1048
4f7b304f
SK
1049 dst_addr_4.s_addr = 0;
1050 netmask.s_addr = 0;
1051
7e5664bd 1052 if (option_bool(OPT_NOWILD) && listen->iface)
3d8df260 1053 {
4f7b304f
SK
1054 auth_dns = listen->iface->dns_auth;
1055
1056 if (listen->family == AF_INET)
1057 {
1058 dst_addr_4 = listen->iface->addr.in.sin_addr;
1059 netmask = listen->iface->netmask;
1060 }
3d8df260 1061 }
4f7b304f 1062
3be34541
SK
1063 iov[0].iov_base = daemon->packet;
1064 iov[0].iov_len = daemon->edns_pktsz;
44a2a316
SK
1065
1066 msg.msg_control = control_u.control;
1067 msg.msg_controllen = sizeof(control_u);
1068 msg.msg_flags = 0;
1069 msg.msg_name = &source_addr;
1070 msg.msg_namelen = sizeof(source_addr);
1071 msg.msg_iov = iov;
1072 msg.msg_iovlen = 1;
1073
de37951c 1074 if ((n = recvmsg(listen->fd, &msg, 0)) == -1)
3be34541 1075 return;
44a2a316 1076
572b41eb 1077 if (n < (int)sizeof(struct dns_header) ||
5e9e0efb 1078 (msg.msg_flags & MSG_TRUNC) ||
572b41eb 1079 (header->hb3 & HB3_QR))
26128d27
SK
1080 return;
1081
44a2a316 1082 source_addr.sa.sa_family = listen->family;
2a7a2b84
SK
1083
1084 if (listen->family == AF_INET)
1085 {
1086 /* Source-port == 0 is an error, we can't send back to that.
1087 http://www.ietf.org/mail-archive/web/dnsop/current/msg11441.html */
1088 if (source_addr.in.sin_port == 0)
1089 return;
1090 }
44a2a316 1091#ifdef HAVE_IPV6
2a7a2b84
SK
1092 else
1093 {
1094 /* Source-port == 0 is an error, we can't send back to that. */
1095 if (source_addr.in6.sin6_port == 0)
1096 return;
1097 source_addr.in6.sin6_flowinfo = 0;
1098 }
44a2a316 1099#endif
2a7a2b84 1100
c8a80487
SK
1101 /* We can be configured to only accept queries from at-most-one-hop-away addresses. */
1102 if (option_bool(OPT_LOCAL_SERVICE))
1103 {
1104 struct addrlist *addr;
1105#ifdef HAVE_IPV6
1106 if (listen->family == AF_INET6)
1107 {
1108 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1109 if ((addr->flags & ADDRLIST_IPV6) &&
1110 is_same_net6(&addr->addr.addr.addr6, &source_addr.in6.sin6_addr, addr->prefixlen))
1111 break;
1112 }
1113 else
1114#endif
1115 {
1116 struct in_addr netmask;
1117 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1118 {
1119 netmask.s_addr = 0xffffffff << (32 - addr->prefixlen);
1120 if (!(addr->flags & ADDRLIST_IPV6) &&
1121 is_same_net(addr->addr.addr.addr4, source_addr.in.sin_addr, netmask))
1122 break;
1123 }
1124 }
1125 if (!addr)
1126 {
0c8584ea
SK
1127 static int warned = 0;
1128 if (!warned)
1129 {
1130 my_syslog(LOG_WARNING, _("Ignoring query from non-local network"));
1131 warned = 1;
1132 }
c8a80487
SK
1133 return;
1134 }
1135 }
1136
2329bef5 1137 if (check_dst)
26128d27
SK
1138 {
1139 struct ifreq ifr;
1140
1141 if (msg.msg_controllen < sizeof(struct cmsghdr))
1142 return;
44a2a316 1143
5e9e0efb 1144#if defined(HAVE_LINUX_NETWORK)
26128d27
SK
1145 if (listen->family == AF_INET)
1146 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
c72daea8 1147 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_PKTINFO)
26128d27 1148 {
8ef5ada2
SK
1149 union {
1150 unsigned char *c;
1151 struct in_pktinfo *p;
1152 } p;
1153 p.c = CMSG_DATA(cmptr);
1154 dst_addr_4 = dst_addr.addr.addr4 = p.p->ipi_spec_dst;
1155 if_index = p.p->ipi_ifindex;
26128d27
SK
1156 }
1157#elif defined(IP_RECVDSTADDR) && defined(IP_RECVIF)
1158 if (listen->family == AF_INET)
44a2a316 1159 {
26128d27 1160 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
8ef5ada2
SK
1161 {
1162 union {
1163 unsigned char *c;
1164 unsigned int *i;
1165 struct in_addr *a;
1166#ifndef HAVE_SOLARIS_NETWORK
1167 struct sockaddr_dl *s;
1168#endif
1169 } p;
1170 p.c = CMSG_DATA(cmptr);
1171 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVDSTADDR)
1172 dst_addr_4 = dst_addr.addr.addr4 = *(p.a);
1173 else if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVIF)
824af85b 1174#ifdef HAVE_SOLARIS_NETWORK
8ef5ada2 1175 if_index = *(p.i);
824af85b 1176#else
8ef5ada2 1177 if_index = p.s->sdl_index;
824af85b 1178#endif
8ef5ada2 1179 }
44a2a316 1180 }
44a2a316 1181#endif
26128d27 1182
44a2a316 1183#ifdef HAVE_IPV6
26128d27
SK
1184 if (listen->family == AF_INET6)
1185 {
1186 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
c72daea8 1187 if (cmptr->cmsg_level == IPPROTO_IPV6 && cmptr->cmsg_type == daemon->v6pktinfo)
26128d27 1188 {
8ef5ada2
SK
1189 union {
1190 unsigned char *c;
1191 struct in6_pktinfo *p;
1192 } p;
1193 p.c = CMSG_DATA(cmptr);
1194
1195 dst_addr.addr.addr6 = p.p->ipi6_addr;
1196 if_index = p.p->ipi6_ifindex;
26128d27
SK
1197 }
1198 }
44a2a316 1199#endif
26128d27
SK
1200
1201 /* enforce available interface configuration */
1202
e25db1f2 1203 if (!indextoname(listen->fd, if_index, ifr.ifr_name))
5e9e0efb 1204 return;
832af0ba 1205
e25db1f2
SK
1206 if (!iface_check(listen->family, &dst_addr, ifr.ifr_name, &auth_dns))
1207 {
1208 if (!option_bool(OPT_CLEVERBIND))
115ac3e4 1209 enumerate_interfaces(0);
3f2873d4
SK
1210 if (!loopback_exception(listen->fd, listen->family, &dst_addr, ifr.ifr_name) &&
1211 !label_exception(if_index, listen->family, &dst_addr))
e25db1f2
SK
1212 return;
1213 }
1214
552af8b9
SK
1215 if (listen->family == AF_INET && option_bool(OPT_LOCALISE))
1216 {
1217 struct irec *iface;
1218
1219 /* get the netmask of the interface whch has the address we were sent to.
1220 This is no neccessarily the interface we arrived on. */
1221
1222 for (iface = daemon->interfaces; iface; iface = iface->next)
1223 if (iface->addr.sa.sa_family == AF_INET &&
1224 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
1225 break;
1226
1227 /* interface may be new */
e25db1f2 1228 if (!iface && !option_bool(OPT_CLEVERBIND))
115ac3e4 1229 enumerate_interfaces(0);
552af8b9
SK
1230
1231 for (iface = daemon->interfaces; iface; iface = iface->next)
1232 if (iface->addr.sa.sa_family == AF_INET &&
1233 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
1234 break;
1235
1236 /* If we failed, abandon localisation */
1237 if (iface)
1238 netmask = iface->netmask;
1239 else
1240 dst_addr_4.s_addr = 0;
1241 }
44a2a316
SK
1242 }
1243
cdeda28f 1244 if (extract_request(header, (size_t)n, daemon->namebuff, &type))
44a2a316 1245 {
b485ed97
SK
1246#ifdef HAVE_AUTH
1247 struct auth_zone *zone;
1248#endif
610e782a
SK
1249 char *types = querystr(auth_dns ? "auth" : "query", type);
1250
44a2a316 1251 if (listen->family == AF_INET)
3be34541 1252 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1a6bca81 1253 (struct all_addr *)&source_addr.in.sin_addr, types);
44a2a316
SK
1254#ifdef HAVE_IPV6
1255 else
3be34541 1256 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1a6bca81 1257 (struct all_addr *)&source_addr.in6.sin6_addr, types);
44a2a316 1258#endif
44a2a316 1259
b485ed97
SK
1260#ifdef HAVE_AUTH
1261 /* find queries for zones we're authoritative for, and answer them directly */
6008bdbb
SK
1262 if (!auth_dns)
1263 for (zone = daemon->auth_zones; zone; zone = zone->next)
1264 if (in_zone(zone, daemon->namebuff, NULL))
1265 {
1266 auth_dns = 1;
1267 local_auth = 1;
1268 break;
1269 }
b485ed97
SK
1270#endif
1271 }
1272
4820dce9 1273#ifdef HAVE_AUTH
4f7b304f 1274 if (auth_dns)
824af85b 1275 {
60b68069 1276 m = answer_auth(header, ((char *) header) + daemon->packet_buff_sz, (size_t)n, now, &source_addr, local_auth);
4f7b304f 1277 if (m >= 1)
b485ed97
SK
1278 {
1279 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
1280 (char *)header, m, &source_addr, &dst_addr, if_index);
1281 daemon->auth_answer++;
1282 }
824af85b 1283 }
44a2a316 1284 else
4820dce9 1285#endif
4f7b304f 1286 {
613ad15d 1287 int ad_reqd, do_bit;
60b68069 1288 m = answer_request(header, ((char *) header) + daemon->packet_buff_sz, (size_t)n,
613ad15d 1289 dst_addr_4, netmask, now, &ad_reqd, &do_bit);
4f7b304f
SK
1290
1291 if (m >= 1)
1292 {
1293 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
1294 (char *)header, m, &source_addr, &dst_addr, if_index);
1295 daemon->local_answer++;
1296 }
1297 else if (forward_query(listen->fd, &source_addr, &dst_addr, if_index,
613ad15d 1298 header, (size_t)n, now, NULL, ad_reqd, do_bit))
4f7b304f
SK
1299 daemon->queries_forwarded++;
1300 else
1301 daemon->local_answer++;
1302 }
44a2a316
SK
1303}
1304
7d7b7b31 1305#ifdef HAVE_DNSSEC
00a5b5d4
SK
1306
1307/* UDP: we've got an unsigned answer, return STAT_INSECURE if we can prove there's no DS
1308 and therefore the answer shouldn't be signed, or STAT_BOGUS if it should be, or
1309 STAT_NEED_DS_NEG and keyname if we need to do the query. */
1310static int send_check_sign(time_t now, struct dns_header *header, size_t plen, char *name, char *keyname)
1311{
1312 struct crec *crecp;
1313 char *name_start = name;
1314 int status = dnssec_chase_cname(now, header, plen, name, keyname);
1315
1316 if (status != STAT_INSECURE)
1317 return status;
1318
1319 while (1)
1320 {
1321 crecp = cache_find_by_name(NULL, name_start, now, F_DS);
1322
1323 if (crecp && (crecp->flags & F_DNSSECOK))
1324 return (crecp->flags & F_NEG) ? STAT_INSECURE : STAT_BOGUS;
1325
1326 if (crecp && (crecp->flags & F_NEG) && (name_start = strchr(name_start, '.')))
1327 {
1328 name_start++; /* chop a label off and try again */
1329 continue;
1330 }
1331
1332 strcpy(keyname, name_start);
1333 return STAT_NEED_DS_NEG;
1334 }
1335}
1336
1337/* Got answer to DS query from send_check_sign, check for proven non-existence, or make the next DS query to try. */
1338static int do_check_sign(time_t now, struct dns_header *header, size_t plen, char *name, char *keyname, int class)
1339
1340{
1341 char *name_start;
1342 unsigned char *p;
1343 int status = dnssec_validate_ds(now, header, plen, name, keyname, class);
1344
1345 if (status != STAT_INSECURE)
1346 {
1347 if (status == STAT_NO_DS)
1348 status = STAT_INSECURE;
1349 return status;
1350 }
1351
1352 p = (unsigned char *)(header+1);
1353
1354 if (extract_name(header, plen, &p, name, 1, 4) &&
1355 (name_start = strchr(name, '.')))
1356 {
1357 name_start++; /* chop a label off and try again */
1358 strcpy(keyname, name_start);
1359 return STAT_NEED_DS_NEG;
1360 }
1361
1362 return STAT_BOGUS;
1363}
1364
1365/* Move toward the root, until we find a signed non-existance of a DS, in which case
1366 an unsigned answer is OK, or we find a signed DS, in which case there should be
1367 a signature, and the answer is BOGUS */
1368static int tcp_check_for_unsigned_zone(time_t now, struct dns_header *header, size_t plen, int class, char *name,
1369 char *keyname, struct server *server, int *keycount)
1370{
1371 size_t m;
1372 unsigned char *packet, *payload;
1373 u16 *length;
1374 unsigned char *p = (unsigned char *)(header+1);
1375 int status;
1376 char *name_start = name;
1377
1378 /* Get first insecure entry in CNAME chain */
1379 status = tcp_key_recurse(now, STAT_CHASE_CNAME, header, plen, class, name, keyname, server, keycount);
1380 if (status == STAT_BOGUS)
1381 return STAT_BOGUS;
1382
1383 if (!(packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16))))
1384 return STAT_BOGUS;
1385
1386 payload = &packet[2];
1387 header = (struct dns_header *)payload;
1388 length = (u16 *)packet;
1389
1390 while (1)
1391 {
1392 unsigned char *newhash, hash[HASH_SIZE];
1393 unsigned char c1, c2;
1394 struct crec *crecp = cache_find_by_name(NULL, name_start, now, F_DS);
1395
1396 if (--(*keycount) == 0)
1397 return STAT_BOGUS;
1398
1399 if (crecp && (crecp->flags & F_DNSSECOK))
1400 {
1401 free(packet);
1402 return (crecp->flags & F_NEG) ? STAT_INSECURE : STAT_BOGUS;
1403 }
1404
1405 /* If we have cached insecurely that a DS doesn't exist,
1406 ise that is a hit for where to start looking for the secure one */
1407 if (crecp && (crecp->flags & F_NEG) && (name_start = strchr(name_start, '.')))
1408 {
1409 name_start++; /* chop a label off and try again */
1410 continue;
1411 }
1412
1413 m = dnssec_generate_query(header, ((char *) header) + 65536, name_start, class, T_DS, &server->addr);
1414
1415 /* We rely on the question section coming back unchanged, ensure it is with the hash. */
1416 if ((newhash = hash_questions(header, (unsigned int)m, name)))
1417 memcpy(hash, newhash, HASH_SIZE);
1418
1419 *length = htons(m);
1420
1421 if (read_write(server->tcpfd, packet, m + sizeof(u16), 0) &&
1422 read_write(server->tcpfd, &c1, 1, 1) &&
1423 read_write(server->tcpfd, &c2, 1, 1) &&
1424 read_write(server->tcpfd, payload, (c1 << 8) | c2, 1))
1425 {
1426 m = (c1 << 8) | c2;
1427
1428 newhash = hash_questions(header, (unsigned int)m, name);
1429 if (newhash && memcmp(hash, newhash, HASH_SIZE) == 0)
1430 {
1431 /* Note this trashes all three name workspaces */
1432 status = tcp_key_recurse(now, STAT_NEED_DS_NEG, header, m, class, name, keyname, server, keycount);
1433
1434 /* We've found a DS which proves the bit of the DNS where the
1435 original query is, is unsigned, so the answer is OK,
1436 if unvalidated. */
1437 if (status == STAT_NO_DS)
1438 {
1439 free(packet);
1440 return STAT_INSECURE;
1441 }
1442
1443 /* No DS, not got to DNSSEC-land yet, go up. */
1444 if (status == STAT_INSECURE)
1445 {
1446 p = (unsigned char *)(header+1);
1447
1448 if (extract_name(header, plen, &p, name, 1, 4) &&
1449 (name_start = strchr(name, '.')))
1450 {
1451 name_start++; /* chop a label off and try again */
1452 continue;
1453 }
1454 }
1455 }
1456 }
1457
1458 free(packet);
1459
1460 return STAT_BOGUS;
1461 }
1462}
1463
7fa836e1
SK
1464static int tcp_key_recurse(time_t now, int status, struct dns_header *header, size_t n,
1465 int class, char *name, char *keyname, struct server *server, int *keycount)
7d7b7b31
SK
1466{
1467 /* Recurse up the key heirarchy */
7d7b7b31 1468 int new_status;
7d7b7b31 1469
7fa836e1
SK
1470 /* limit the amount of work we do, to avoid cycling forever on loops in the DNS */
1471 if (--(*keycount) == 0)
1472 return STAT_INSECURE;
7d7b7b31 1473
7fa836e1
SK
1474 if (status == STAT_NEED_KEY)
1475 new_status = dnssec_validate_by_ds(now, header, n, name, keyname, class);
00a5b5d4
SK
1476 else if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG)
1477 {
1478 new_status = dnssec_validate_ds(now, header, n, name, keyname, class);
1479 if (status == STAT_NEED_DS && new_status == STAT_NO_DS)
1480 new_status = STAT_INSECURE;
1481 }
1482 else if (status == STAT_CHASE_CNAME)
1483 new_status = dnssec_chase_cname(now, header, n, name, keyname);
1484 else
1485 {
1486 new_status = dnssec_validate_reply(now, header, n, name, keyname, &class, NULL);
1487
1488 if (new_status == STAT_NO_SIG)
1489 {
1490 if (option_bool(OPT_DNSSEC_NO_SIGN))
1491 new_status = tcp_check_for_unsigned_zone(now, header, n, class, name, keyname, server, keycount);
1492 else
1493 new_status = STAT_INSECURE;
1494 }
1495 }
1496
7fa836e1
SK
1497 /* Can't validate because we need a key/DS whose name now in keyname.
1498 Make query for same, and recurse to validate */
1499 if (new_status == STAT_NEED_DS || new_status == STAT_NEED_KEY)
7d7b7b31 1500 {
7fa836e1
SK
1501 size_t m;
1502 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
1503 unsigned char *payload = &packet[2];
1504 struct dns_header *new_header = (struct dns_header *)payload;
1505 u16 *length = (u16 *)packet;
1506 unsigned char c1, c2;
1507
1508 if (!packet)
1509 return STAT_INSECURE;
1510
1511 another_tcp_key:
1512 m = dnssec_generate_query(new_header, ((char *) new_header) + 65536, keyname, class,
1513 new_status == STAT_NEED_KEY ? T_DNSKEY : T_DS, &server->addr);
7d7b7b31 1514
7fa836e1 1515 *length = htons(m);
7d7b7b31 1516
7fa836e1
SK
1517 if (!read_write(server->tcpfd, packet, m + sizeof(u16), 0) ||
1518 !read_write(server->tcpfd, &c1, 1, 1) ||
1519 !read_write(server->tcpfd, &c2, 1, 1) ||
1520 !read_write(server->tcpfd, payload, (c1 << 8) | c2, 1))
1521 new_status = STAT_INSECURE;
1522 else
7d7b7b31 1523 {
7fa836e1
SK
1524 m = (c1 << 8) | c2;
1525
00a5b5d4
SK
1526 new_status = tcp_key_recurse(now, new_status, new_header, m, class, name, keyname, server, keycount);
1527
1528 if (new_status == STAT_SECURE)
7d7b7b31 1529 {
7fa836e1
SK
1530 /* Reached a validated record, now try again at this level.
1531 Note that we may get ANOTHER NEED_* if an answer needs more than one key.
1532 If so, go round again. */
7d7b7b31 1533
7fa836e1
SK
1534 if (status == STAT_NEED_KEY)
1535 new_status = dnssec_validate_by_ds(now, header, n, name, keyname, class);
00a5b5d4
SK
1536 else if (status == STAT_NEED_DS || status == STAT_NEED_DS_NEG)
1537 {
1538 new_status = dnssec_validate_ds(now, header, n, name, keyname, class);
1539 if (status == STAT_NEED_DS && new_status == STAT_NO_DS)
1540 new_status = STAT_INSECURE; /* Validated no DS */
1541 }
1542 else if (status == STAT_CHASE_CNAME)
1543 new_status = dnssec_chase_cname(now, header, n, name, keyname);
1544 else
1545 {
1546 new_status = dnssec_validate_reply(now, header, n, name, keyname, &class, NULL);
1547
1548 if (new_status == STAT_NO_SIG)
1549 {
1550 if (option_bool(OPT_DNSSEC_NO_SIGN))
1551 new_status = tcp_check_for_unsigned_zone(now, header, n, class, name, keyname, server, keycount);
1552 else
1553 new_status = STAT_INSECURE;
1554 }
1555 }
1556
7d7b7b31 1557 if (new_status == STAT_NEED_DS || new_status == STAT_NEED_KEY)
7fa836e1 1558 goto another_tcp_key;
7d7b7b31
SK
1559 }
1560 }
7d7b7b31 1561
7fa836e1
SK
1562 free(packet);
1563 }
7d7b7b31
SK
1564 return new_status;
1565}
1566#endif
1567
1568
feba5c1d
SK
1569/* The daemon forks before calling this: it should deal with one connection,
1570 blocking as necessary, and then return. Note, need to be a bit careful
1571 about resources for debug mode, when the fork is suppressed: that's
1572 done by the caller. */
5aabfc78 1573unsigned char *tcp_request(int confd, time_t now,
4f7b304f 1574 union mysockaddr *local_addr, struct in_addr netmask, int auth_dns)
feba5c1d 1575{
28866e95
SK
1576 size_t size = 0;
1577 int norebind = 0;
3b195961 1578#ifdef HAVE_AUTH
19b16891 1579 int local_auth = 0;
3b195961 1580#endif
613ad15d
SK
1581 int checking_disabled, ad_question, do_bit, added_pheader = 0;
1582 int check_subnet, no_cache_dnssec = 0, cache_secure = 0;
cdeda28f 1583 size_t m;
ee86ce68
SK
1584 unsigned short qtype;
1585 unsigned int gotname;
feba5c1d 1586 unsigned char c1, c2;
4b5ea12e
SK
1587 /* Max TCP packet + slop + size */
1588 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
1589 unsigned char *payload = &packet[2];
1590 /* largest field in header is 16-bits, so this is still sufficiently aligned */
1591 struct dns_header *header = (struct dns_header *)payload;
1592 u16 *length = (u16 *)packet;
3be34541 1593 struct server *last_server;
7de060b0
SK
1594 struct in_addr dst_addr_4;
1595 union mysockaddr peer_addr;
1596 socklen_t peer_len = sizeof(union mysockaddr);
3be34541 1597
7de060b0
SK
1598 if (getpeername(confd, (struct sockaddr *)&peer_addr, &peer_len) == -1)
1599 return packet;
c8a80487
SK
1600
1601 /* We can be configured to only accept queries from at-most-one-hop-away addresses. */
1602 if (option_bool(OPT_LOCAL_SERVICE))
1603 {
1604 struct addrlist *addr;
1605#ifdef HAVE_IPV6
1606 if (peer_addr.sa.sa_family == AF_INET6)
1607 {
1608 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1609 if ((addr->flags & ADDRLIST_IPV6) &&
1610 is_same_net6(&addr->addr.addr.addr6, &peer_addr.in6.sin6_addr, addr->prefixlen))
1611 break;
1612 }
1613 else
1614#endif
1615 {
1616 struct in_addr netmask;
1617 for (addr = daemon->interface_addrs; addr; addr = addr->next)
1618 {
1619 netmask.s_addr = 0xffffffff << (32 - addr->prefixlen);
1620 if (!(addr->flags & ADDRLIST_IPV6) &&
1621 is_same_net(addr->addr.addr.addr4, peer_addr.in.sin_addr, netmask))
1622 break;
1623 }
1624 }
1625 if (!addr)
1626 {
1627 my_syslog(LOG_WARNING, _("Ignoring query from non-local network"));
1628 return packet;
1629 }
1630 }
7de060b0 1631
feba5c1d
SK
1632 while (1)
1633 {
1634 if (!packet ||
1635 !read_write(confd, &c1, 1, 1) || !read_write(confd, &c2, 1, 1) ||
1636 !(size = c1 << 8 | c2) ||
4b5ea12e 1637 !read_write(confd, payload, size, 1))
feba5c1d
SK
1638 return packet;
1639
572b41eb 1640 if (size < (int)sizeof(struct dns_header))
feba5c1d
SK
1641 continue;
1642
ed4c0767
SK
1643 check_subnet = 0;
1644
28866e95 1645 /* save state of "cd" flag in query */
7d7b7b31
SK
1646 if ((checking_disabled = header->hb4 & HB4_CD))
1647 no_cache_dnssec = 1;
28866e95 1648
3be34541 1649 if ((gotname = extract_request(header, (unsigned int)size, daemon->namebuff, &qtype)))
feba5c1d 1650 {
b485ed97
SK
1651#ifdef HAVE_AUTH
1652 struct auth_zone *zone;
1653#endif
610e782a 1654 char *types = querystr(auth_dns ? "auth" : "query", qtype);
7de060b0
SK
1655
1656 if (peer_addr.sa.sa_family == AF_INET)
1657 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1658 (struct all_addr *)&peer_addr.in.sin_addr, types);
feba5c1d 1659#ifdef HAVE_IPV6
7de060b0
SK
1660 else
1661 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1662 (struct all_addr *)&peer_addr.in6.sin6_addr, types);
feba5c1d 1663#endif
b485ed97
SK
1664
1665#ifdef HAVE_AUTH
1666 /* find queries for zones we're authoritative for, and answer them directly */
6008bdbb
SK
1667 if (!auth_dns)
1668 for (zone = daemon->auth_zones; zone; zone = zone->next)
1669 if (in_zone(zone, daemon->namebuff, NULL))
1670 {
1671 auth_dns = 1;
1672 local_auth = 1;
1673 break;
1674 }
b485ed97 1675#endif
feba5c1d
SK
1676 }
1677
7de060b0
SK
1678 if (local_addr->sa.sa_family == AF_INET)
1679 dst_addr_4 = local_addr->in.sin_addr;
1680 else
1681 dst_addr_4.s_addr = 0;
1682
4820dce9 1683#ifdef HAVE_AUTH
4f7b304f 1684 if (auth_dns)
19b16891 1685 m = answer_auth(header, ((char *) header) + 65536, (size_t)size, now, &peer_addr, local_auth);
4f7b304f 1686 else
4820dce9 1687#endif
feba5c1d 1688 {
4f7b304f
SK
1689 /* m > 0 if answered from cache */
1690 m = answer_request(header, ((char *) header) + 65536, (size_t)size,
613ad15d 1691 dst_addr_4, netmask, now, &ad_question, &do_bit);
feba5c1d 1692
4f7b304f
SK
1693 /* Do this by steam now we're not in the select() loop */
1694 check_log_writer(NULL);
1695
1696 if (m == 0)
feba5c1d 1697 {
4f7b304f
SK
1698 unsigned int flags = 0;
1699 struct all_addr *addrp = NULL;
1700 int type = 0;
1701 char *domain = NULL;
feba5c1d 1702
4f7b304f
SK
1703 if (option_bool(OPT_ADD_MAC))
1704 size = add_mac(header, size, ((char *) header) + 65536, &peer_addr);
ed4c0767
SK
1705
1706 if (option_bool(OPT_CLIENT_SUBNET))
1707 {
1708 size_t new = add_source_addr(header, size, ((char *) header) + 65536, &peer_addr);
1709 if (size != new)
1710 {
1711 size = new;
1712 check_subnet = 1;
1713 }
1714 }
1715
4f7b304f
SK
1716 if (gotname)
1717 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
1718
1719 if (type != 0 || option_bool(OPT_ORDER) || !daemon->last_server)
1720 last_server = daemon->servers;
1721 else
1722 last_server = daemon->last_server;
1723
1724 if (!flags && last_server)
1725 {
1726 struct server *firstsendto = NULL;
8a9be9e4 1727#ifdef HAVE_DNSSEC
703c7ff4 1728 unsigned char *newhash, hash[HASH_SIZE];
8a9be9e4
SK
1729 if ((newhash = hash_questions(header, (unsigned int)size, daemon->keyname)))
1730 memcpy(hash, newhash, HASH_SIZE);
1731#else
4f7b304f 1732 unsigned int crc = questions_crc(header, (unsigned int)size, daemon->namebuff);
8a9be9e4 1733#endif
4f7b304f
SK
1734 /* Loop round available servers until we succeed in connecting to one.
1735 Note that this code subtley ensures that consecutive queries on this connection
1736 which can go to the same server, do so. */
1737 while (1)
feba5c1d 1738 {
4f7b304f
SK
1739 if (!firstsendto)
1740 firstsendto = last_server;
1741 else
1742 {
1743 if (!(last_server = last_server->next))
1744 last_server = daemon->servers;
1745
1746 if (last_server == firstsendto)
1747 break;
1748 }
1749
1750 /* server for wrong domain */
1751 if (type != (last_server->flags & SERV_TYPE) ||
1752 (type == SERV_HAS_DOMAIN && !hostname_isequal(domain, last_server->domain)))
7de060b0
SK
1753 continue;
1754
4f7b304f 1755 if (last_server->tcpfd == -1)
7de060b0 1756 {
4f7b304f
SK
1757 if ((last_server->tcpfd = socket(last_server->addr.sa.sa_family, SOCK_STREAM, 0)) == -1)
1758 continue;
1759
1760 if ((!local_bind(last_server->tcpfd, &last_server->source_addr, last_server->interface, 1) ||
1761 connect(last_server->tcpfd, &last_server->addr.sa, sa_len(&last_server->addr)) == -1))
1762 {
1763 close(last_server->tcpfd);
1764 last_server->tcpfd = -1;
1765 continue;
1766 }
1767
7d7b7b31
SK
1768#ifdef HAVE_DNSSEC
1769 if (option_bool(OPT_DNSSEC_VALID))
1770 {
613ad15d
SK
1771 size_t new_size = add_do_bit(header, size, ((char *) header) + 65536);
1772
2ecd9bd5
SK
1773 /* For debugging, set Checking Disabled, otherwise, have the upstream check too,
1774 this allows it to select auth servers when one is returning bad data. */
1775 if (option_bool(OPT_DNSSEC_DEBUG))
1776 header->hb4 |= HB4_CD;
613ad15d
SK
1777
1778 if (size != new_size)
1779 added_pheader = 1;
1780
1781 size = new_size;
7d7b7b31
SK
1782 }
1783#endif
1784
7de060b0 1785#ifdef HAVE_CONNTRACK
4f7b304f
SK
1786 /* Copy connection mark of incoming query to outgoing connection. */
1787 if (option_bool(OPT_CONNTRACK))
1788 {
1789 unsigned int mark;
1790 struct all_addr local;
7de060b0 1791#ifdef HAVE_IPV6
4f7b304f
SK
1792 if (local_addr->sa.sa_family == AF_INET6)
1793 local.addr.addr6 = local_addr->in6.sin6_addr;
1794 else
7de060b0 1795#endif
4f7b304f
SK
1796 local.addr.addr4 = local_addr->in.sin_addr;
1797
1798 if (get_incoming_mark(&peer_addr, &local, 1, &mark))
1799 setsockopt(last_server->tcpfd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
1800 }
7de060b0 1801#endif
4f7b304f
SK
1802 }
1803
4b5ea12e 1804 *length = htons(size);
4f7b304f 1805
4b5ea12e 1806 if (!read_write(last_server->tcpfd, packet, size + sizeof(u16), 0) ||
4f7b304f 1807 !read_write(last_server->tcpfd, &c1, 1, 1) ||
7d7b7b31
SK
1808 !read_write(last_server->tcpfd, &c2, 1, 1) ||
1809 !read_write(last_server->tcpfd, payload, (c1 << 8) | c2, 1))
4f7b304f
SK
1810 {
1811 close(last_server->tcpfd);
1812 last_server->tcpfd = -1;
1813 continue;
1814 }
1815
1816 m = (c1 << 8) | c2;
4f7b304f
SK
1817
1818 if (!gotname)
1819 strcpy(daemon->namebuff, "query");
1820 if (last_server->addr.sa.sa_family == AF_INET)
1821 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1822 (struct all_addr *)&last_server->addr.in.sin_addr, NULL);
feba5c1d 1823#ifdef HAVE_IPV6
4f7b304f
SK
1824 else
1825 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1826 (struct all_addr *)&last_server->addr.in6.sin6_addr, NULL);
feba5c1d 1827#endif
7d7b7b31
SK
1828
1829#ifdef HAVE_DNSSEC
1830 if (option_bool(OPT_DNSSEC_VALID) && !checking_disabled)
1831 {
7fa836e1
SK
1832 int keycount = DNSSEC_WORK; /* Limit to number of DNSSEC questions, to catch loops and avoid filling cache. */
1833 int status = tcp_key_recurse(now, STAT_TRUNCATED, header, m, 0, daemon->namebuff, daemon->keyname, last_server, &keycount);
1834 char *result;
1835
1836 if (keycount == 0)
1837 result = "ABANDONED";
1838 else
1839 result = (status == STAT_SECURE ? "SECURE" : (status == STAT_INSECURE ? "INSECURE" : "BOGUS"));
7d7b7b31 1840
7fa836e1 1841 log_query(F_KEYTAG | F_SECSTAT, "result", NULL, result);
7d7b7b31 1842
7d7b7b31
SK
1843 if (status == STAT_BOGUS)
1844 no_cache_dnssec = 1;
7fa836e1 1845
7d7b7b31
SK
1846 if (status == STAT_SECURE)
1847 cache_secure = 1;
1848 }
1849#endif
1850
1851 /* restore CD bit to the value in the query */
1852 if (checking_disabled)
1853 header->hb4 |= HB4_CD;
1854 else
1855 header->hb4 &= ~HB4_CD;
4f7b304f
SK
1856
1857 /* There's no point in updating the cache, since this process will exit and
1858 lose the information after a few queries. We make this call for the alias and
1859 bogus-nxdomain side-effects. */
1860 /* If the crc of the question section doesn't match the crc we sent, then
1861 someone might be attempting to insert bogus values into the cache by
1862 sending replies containing questions and bogus answers. */
8a9be9e4
SK
1863#ifdef HAVE_DNSSEC
1864 newhash = hash_questions(header, (unsigned int)m, daemon->namebuff);
1865 if (!newhash || memcmp(hash, newhash, HASH_SIZE) != 0)
703c7ff4
SK
1866 {
1867 m = 0;
1868 break;
1869 }
8a9be9e4
SK
1870#else
1871 if (crc != questions_crc(header, (unsigned int)m, daemon->namebuff))
703c7ff4
SK
1872 {
1873 m = 0;
1874 break;
1875 }
8a9be9e4
SK
1876#endif
1877
1878 m = process_reply(header, now, last_server, (unsigned int)m,
1879 option_bool(OPT_NO_REBIND) && !norebind, no_cache_dnssec,
613ad15d 1880 cache_secure, ad_question, do_bit, added_pheader, check_subnet, &peer_addr);
4f7b304f
SK
1881
1882 break;
1883 }
feba5c1d 1884 }
4f7b304f
SK
1885
1886 /* In case of local answer or no connections made. */
1887 if (m == 0)
1888 m = setup_reply(header, (unsigned int)size, addrp, flags, daemon->local_ttl);
feba5c1d 1889 }
feba5c1d 1890 }
4f7b304f 1891
5aabfc78 1892 check_log_writer(NULL);
feba5c1d 1893
4b5ea12e
SK
1894 *length = htons(m);
1895
1896 if (m == 0 || !read_write(confd, packet, m + sizeof(u16), 0))
feba5c1d
SK
1897 return packet;
1898 }
1899}
1900
1697269c 1901static struct frec *allocate_frec(time_t now)
9e4abcb5 1902{
1697269c
SK
1903 struct frec *f;
1904
5aabfc78 1905 if ((f = (struct frec *)whine_malloc(sizeof(struct frec))))
9e4abcb5 1906 {
1a6bca81 1907 f->next = daemon->frec_list;
1697269c 1908 f->time = now;
832af0ba 1909 f->sentto = NULL;
1a6bca81 1910 f->rfd4 = NULL;
28866e95 1911 f->flags = 0;
1a6bca81
SK
1912#ifdef HAVE_IPV6
1913 f->rfd6 = NULL;
3a237152
SK
1914#endif
1915#ifdef HAVE_DNSSEC
97bc798b 1916 f->dependent = NULL;
3a237152 1917 f->blocking_query = NULL;
4619d946 1918 f->stash = NULL;
1a6bca81
SK
1919#endif
1920 daemon->frec_list = f;
1697269c 1921 }
9e4abcb5 1922
1697269c
SK
1923 return f;
1924}
9e4abcb5 1925
1a6bca81
SK
1926static struct randfd *allocate_rfd(int family)
1927{
1928 static int finger = 0;
1929 int i;
1930
1931 /* limit the number of sockets we have open to avoid starvation of
1932 (eg) TFTP. Once we have a reasonable number, randomness should be OK */
1933
1934 for (i = 0; i < RANDOM_SOCKS; i++)
9009d746 1935 if (daemon->randomsocks[i].refcount == 0)
1a6bca81 1936 {
9009d746
SK
1937 if ((daemon->randomsocks[i].fd = random_sock(family)) == -1)
1938 break;
1939
1a6bca81
SK
1940 daemon->randomsocks[i].refcount = 1;
1941 daemon->randomsocks[i].family = family;
1942 return &daemon->randomsocks[i];
1943 }
1944
9009d746 1945 /* No free ones or cannot get new socket, grab an existing one */
1a6bca81
SK
1946 for (i = 0; i < RANDOM_SOCKS; i++)
1947 {
1948 int j = (i+finger) % RANDOM_SOCKS;
9009d746
SK
1949 if (daemon->randomsocks[j].refcount != 0 &&
1950 daemon->randomsocks[j].family == family &&
1951 daemon->randomsocks[j].refcount != 0xffff)
1a6bca81
SK
1952 {
1953 finger = j;
1954 daemon->randomsocks[j].refcount++;
1955 return &daemon->randomsocks[j];
1956 }
1957 }
1958
1959 return NULL; /* doom */
1960}
1a6bca81
SK
1961static void free_frec(struct frec *f)
1962{
1963 if (f->rfd4 && --(f->rfd4->refcount) == 0)
1964 close(f->rfd4->fd);
1965
1966 f->rfd4 = NULL;
1967 f->sentto = NULL;
28866e95 1968 f->flags = 0;
1a6bca81
SK
1969
1970#ifdef HAVE_IPV6
1971 if (f->rfd6 && --(f->rfd6->refcount) == 0)
1972 close(f->rfd6->fd);
1973
1974 f->rfd6 = NULL;
1975#endif
3a237152
SK
1976
1977#ifdef HAVE_DNSSEC
1978 if (f->stash)
0fc2f313
SK
1979 {
1980 blockdata_free(f->stash);
1981 f->stash = NULL;
1982 }
3a237152
SK
1983
1984 /* Anything we're waiting on is pointless now, too */
1985 if (f->blocking_query)
1986 free_frec(f->blocking_query);
1987 f->blocking_query = NULL;
39048ad1 1988 f->dependent = NULL;
3a237152 1989#endif
1a6bca81
SK
1990}
1991
1697269c
SK
1992/* if wait==NULL return a free or older than TIMEOUT record.
1993 else return *wait zero if one available, or *wait is delay to
1a6bca81 1994 when the oldest in-use record will expire. Impose an absolute
3a237152
SK
1995 limit of 4*TIMEOUT before we wipe things (for random sockets).
1996 If force is set, always return a result, even if we have
1997 to allocate above the limit. */
1998struct frec *get_new_frec(time_t now, int *wait, int force)
1697269c 1999{
1a6bca81 2000 struct frec *f, *oldest, *target;
1697269c
SK
2001 int count;
2002
2003 if (wait)
2004 *wait = 0;
2005
1a6bca81 2006 for (f = daemon->frec_list, oldest = NULL, target = NULL, count = 0; f; f = f->next, count++)
832af0ba 2007 if (!f->sentto)
1a6bca81
SK
2008 target = f;
2009 else
1697269c 2010 {
1a6bca81
SK
2011 if (difftime(now, f->time) >= 4*TIMEOUT)
2012 {
2013 free_frec(f);
2014 target = f;
2015 }
2016
2017 if (!oldest || difftime(f->time, oldest->time) <= 0)
2018 oldest = f;
1697269c 2019 }
1a6bca81
SK
2020
2021 if (target)
2022 {
2023 target->time = now;
2024 return target;
2025 }
9e4abcb5
SK
2026
2027 /* can't find empty one, use oldest if there is one
2028 and it's older than timeout */
1697269c 2029 if (oldest && ((int)difftime(now, oldest->time)) >= TIMEOUT)
9e4abcb5 2030 {
1697269c
SK
2031 /* keep stuff for twice timeout if we can by allocating a new
2032 record instead */
2033 if (difftime(now, oldest->time) < 2*TIMEOUT &&
2034 count <= daemon->ftabsize &&
2035 (f = allocate_frec(now)))
2036 return f;
2037
2038 if (!wait)
2039 {
1a6bca81 2040 free_frec(oldest);
1697269c
SK
2041 oldest->time = now;
2042 }
9e4abcb5
SK
2043 return oldest;
2044 }
2045
1697269c 2046 /* none available, calculate time 'till oldest record expires */
3a237152 2047 if (!force && count > daemon->ftabsize)
1697269c 2048 {
0da5e897
MSB
2049 static time_t last_log = 0;
2050
1697269c
SK
2051 if (oldest && wait)
2052 *wait = oldest->time + (time_t)TIMEOUT - now;
0da5e897
MSB
2053
2054 if ((int)difftime(now, last_log) > 5)
2055 {
2056 last_log = now;
2057 my_syslog(LOG_WARNING, _("Maximum number of concurrent DNS queries reached (max: %d)"), daemon->ftabsize);
2058 }
2059
9e4abcb5
SK
2060 return NULL;
2061 }
1697269c
SK
2062
2063 if (!(f = allocate_frec(now)) && wait)
2064 /* wait one second on malloc failure */
2065 *wait = 1;
9e4abcb5 2066
9e4abcb5
SK
2067 return f; /* OK if malloc fails and this is NULL */
2068}
2069
832af0ba 2070/* crc is all-ones if not known. */
8a9be9e4 2071static struct frec *lookup_frec(unsigned short id, void *hash)
9e4abcb5
SK
2072{
2073 struct frec *f;
2074
1a6bca81 2075 for(f = daemon->frec_list; f; f = f->next)
832af0ba 2076 if (f->sentto && f->new_id == id &&
8a9be9e4 2077 (!hash || memcmp(hash, f->hash, HASH_SIZE) == 0))
9e4abcb5
SK
2078 return f;
2079
2080 return NULL;
2081}
2082
2083static struct frec *lookup_frec_by_sender(unsigned short id,
fd9fa481 2084 union mysockaddr *addr,
8a9be9e4 2085 void *hash)
9e4abcb5 2086{
feba5c1d
SK
2087 struct frec *f;
2088
1a6bca81 2089 for(f = daemon->frec_list; f; f = f->next)
832af0ba 2090 if (f->sentto &&
9e4abcb5 2091 f->orig_id == id &&
8a9be9e4 2092 memcmp(hash, f->hash, HASH_SIZE) == 0 &&
9e4abcb5
SK
2093 sockaddr_isequal(&f->source, addr))
2094 return f;
2095
2096 return NULL;
2097}
2098
849a8357 2099/* A server record is going away, remove references to it */
5aabfc78 2100void server_gone(struct server *server)
849a8357
SK
2101{
2102 struct frec *f;
2103
1a6bca81 2104 for (f = daemon->frec_list; f; f = f->next)
832af0ba 2105 if (f->sentto && f->sentto == server)
1a6bca81 2106 free_frec(f);
849a8357
SK
2107
2108 if (daemon->last_server == server)
2109 daemon->last_server = NULL;
2110
2111 if (daemon->srv_save == server)
2112 daemon->srv_save = NULL;
2113}
9e4abcb5 2114
/* Return a random 16-bit id that is not the new_id of any in-use
   forwarding record. Candidates are drawn from rand16() until
   lookup_frec() finds no record using the value. */
static unsigned short get_id(void)
{
  unsigned short candidate;

  for (;;)
    {
      candidate = rand16();

      if (!lookup_frec(candidate, NULL))
        return candidate;
    }
}
2126
2127
2128
2129
2130