]> git.ipfire.org Git - people/ms/dnsmasq.git/blob - src/forward.c
Don't filter by subnet when handling local queries for auth-zones.
[people/ms/dnsmasq.git] / src / forward.c
1 /* dnsmasq is Copyright (c) 2000-2013 Simon Kelley
2
3 This program is free software; you can redistribute it and/or modify
4 it under the terms of the GNU General Public License as published by
5 the Free Software Foundation; version 2 dated June, 1991, or
6 (at your option) version 3 dated 29 June, 2007.
7
8 This program is distributed in the hope that it will be useful,
9 but WITHOUT ANY WARRANTY; without even the implied warranty of
10 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11 GNU General Public License for more details.
12
13 You should have received a copy of the GNU General Public License
14 along with this program. If not, see <http://www.gnu.org/licenses/>.
15 */
16
17 #include "dnsmasq.h"
18
/* Prototypes for the file-local (static) helpers that manage forwarding
   records, query ids and random-port sockets. */
static struct frec *lookup_frec(unsigned short id, unsigned int crc);
static struct frec *lookup_frec_by_sender(unsigned short id, union mysockaddr *addr, unsigned int crc);
static unsigned short get_id(unsigned int crc);
static void free_frec(struct frec *f);
static struct randfd *allocate_rfd(int family);
26
27 /* Send a UDP packet with its source address set as "source"
28 unless nowild is true, when we just send it with the kernel default */
29 int send_from(int fd, int nowild, char *packet, size_t len,
30 union mysockaddr *to, struct all_addr *source,
31 unsigned int iface)
32 {
33 struct msghdr msg;
34 struct iovec iov[1];
35 union {
36 struct cmsghdr align; /* this ensures alignment */
37 #if defined(HAVE_LINUX_NETWORK)
38 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
39 #elif defined(IP_SENDSRCADDR)
40 char control[CMSG_SPACE(sizeof(struct in_addr))];
41 #endif
42 #ifdef HAVE_IPV6
43 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
44 #endif
45 } control_u;
46
47 iov[0].iov_base = packet;
48 iov[0].iov_len = len;
49
50 msg.msg_control = NULL;
51 msg.msg_controllen = 0;
52 msg.msg_flags = 0;
53 msg.msg_name = to;
54 msg.msg_namelen = sa_len(to);
55 msg.msg_iov = iov;
56 msg.msg_iovlen = 1;
57
58 if (!nowild)
59 {
60 struct cmsghdr *cmptr;
61 msg.msg_control = &control_u;
62 msg.msg_controllen = sizeof(control_u);
63 cmptr = CMSG_FIRSTHDR(&msg);
64
65 if (to->sa.sa_family == AF_INET)
66 {
67 #if defined(HAVE_LINUX_NETWORK)
68 struct in_pktinfo p;
69 p.ipi_ifindex = 0;
70 p.ipi_spec_dst = source->addr.addr4;
71 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
72 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_pktinfo));
73 cmptr->cmsg_level = IPPROTO_IP;
74 cmptr->cmsg_type = IP_PKTINFO;
75 #elif defined(IP_SENDSRCADDR)
76 memcpy(CMSG_DATA(cmptr), &(source->addr.addr4), sizeof(source->addr.addr4));
77 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_addr));
78 cmptr->cmsg_level = IPPROTO_IP;
79 cmptr->cmsg_type = IP_SENDSRCADDR;
80 #endif
81 }
82 else
83 #ifdef HAVE_IPV6
84 {
85 struct in6_pktinfo p;
86 p.ipi6_ifindex = iface; /* Need iface for IPv6 to handle link-local addrs */
87 p.ipi6_addr = source->addr.addr6;
88 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
89 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
90 cmptr->cmsg_type = daemon->v6pktinfo;
91 cmptr->cmsg_level = IPPROTO_IPV6;
92 }
93 #else
94 (void)iface; /* eliminate warning */
95 #endif
96 }
97
98 while (sendmsg(fd, &msg, 0) == -1)
99 {
100 if (retry_send())
101 continue;
102
103 /* If interface is still in DAD, EINVAL results - ignore that. */
104 if (errno == EINVAL)
105 break;
106
107 my_syslog(LOG_ERR, _("failed to send packet: %s"), strerror(errno));
108 return 0;
109 }
110
111 return 1;
112 }
113
114 static unsigned int search_servers(time_t now, struct all_addr **addrpp,
115 unsigned int qtype, char *qdomain, int *type, char **domain, int *norebind)
116
117 {
118 /* If the query ends in the domain in one of our servers, set
119 domain to point to that name. We find the largest match to allow both
120 domain.org and sub.domain.org to exist. */
121
122 unsigned int namelen = strlen(qdomain);
123 unsigned int matchlen = 0;
124 struct server *serv;
125 unsigned int flags = 0;
126
127 for (serv = daemon->servers; serv; serv=serv->next)
128 /* domain matches take priority over NODOTS matches */
129 if ((serv->flags & SERV_FOR_NODOTS) && *type != SERV_HAS_DOMAIN && !strchr(qdomain, '.') && namelen != 0)
130 {
131 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
132 *type = SERV_FOR_NODOTS;
133 if (serv->flags & SERV_NO_ADDR)
134 flags = F_NXDOMAIN;
135 else if (serv->flags & SERV_LITERAL_ADDRESS)
136 {
137 if (sflag & qtype)
138 {
139 flags = sflag;
140 if (serv->addr.sa.sa_family == AF_INET)
141 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
142 #ifdef HAVE_IPV6
143 else
144 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
145 #endif
146 }
147 else if (!flags || (flags & F_NXDOMAIN))
148 flags = F_NOERR;
149 }
150 }
151 else if (serv->flags & SERV_HAS_DOMAIN)
152 {
153 unsigned int domainlen = strlen(serv->domain);
154 char *matchstart = qdomain + namelen - domainlen;
155 if (namelen >= domainlen &&
156 hostname_isequal(matchstart, serv->domain) &&
157 (domainlen == 0 || namelen == domainlen || *(matchstart-1) == '.' ))
158 {
159 if (serv->flags & SERV_NO_REBIND)
160 *norebind = 1;
161 else
162 {
163 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
164 /* implement priority rules for --address and --server for same domain.
165 --address wins if the address is for the correct AF
166 --server wins otherwise. */
167 if (domainlen != 0 && domainlen == matchlen)
168 {
169 if ((serv->flags & SERV_LITERAL_ADDRESS))
170 {
171 if (!(sflag & qtype) && flags == 0)
172 continue;
173 }
174 else
175 {
176 if (flags & (F_IPV4 | F_IPV6))
177 continue;
178 }
179 }
180
181 if (domainlen >= matchlen)
182 {
183 *type = serv->flags & (SERV_HAS_DOMAIN | SERV_USE_RESOLV | SERV_NO_REBIND);
184 *domain = serv->domain;
185 matchlen = domainlen;
186 if (serv->flags & SERV_NO_ADDR)
187 flags = F_NXDOMAIN;
188 else if (serv->flags & SERV_LITERAL_ADDRESS)
189 {
190 if (sflag & qtype)
191 {
192 flags = sflag;
193 if (serv->addr.sa.sa_family == AF_INET)
194 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
195 #ifdef HAVE_IPV6
196 else
197 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
198 #endif
199 }
200 else if (!flags || (flags & F_NXDOMAIN))
201 flags = F_NOERR;
202 }
203 else
204 flags = 0;
205 }
206 }
207 }
208 }
209
210 if (flags == 0 && !(qtype & F_QUERY) &&
211 option_bool(OPT_NODOTS_LOCAL) && !strchr(qdomain, '.') && namelen != 0)
212 /* don't forward A or AAAA queries for simple names, except the empty name */
213 flags = F_NOERR;
214
215 if (flags == F_NXDOMAIN && check_for_local_domain(qdomain, now))
216 flags = F_NOERR;
217
218 if (flags)
219 {
220 int logflags = 0;
221
222 if (flags == F_NXDOMAIN || flags == F_NOERR)
223 logflags = F_NEG | qtype;
224
225 log_query(logflags | flags | F_CONFIG | F_FORWARD, qdomain, *addrpp, NULL);
226 }
227 else if ((*type) & SERV_USE_RESOLV)
228 {
229 *type = 0; /* use normal servers for this domain */
230 *domain = NULL;
231 }
232 return flags;
233 }
234
235 static int forward_query(int udpfd, union mysockaddr *udpaddr,
236 struct all_addr *dst_addr, unsigned int dst_iface,
237 struct dns_header *header, size_t plen, time_t now, struct frec *forward)
238 {
239 char *domain = NULL;
240 int type = 0, norebind = 0;
241 struct all_addr *addrp = NULL;
242 unsigned int crc = questions_crc(header, plen, daemon->namebuff);
243 unsigned int flags = 0;
244 unsigned int gotname = extract_request(header, plen, daemon->namebuff, NULL);
245 struct server *start = NULL;
246
247 /* RFC 4035: sect 4.6 para 2 */
248 header->hb4 &= ~HB4_AD;
249
250 /* may be no servers available. */
251 if (!daemon->servers)
252 forward = NULL;
253 else if (forward || (forward = lookup_frec_by_sender(ntohs(header->id), udpaddr, crc)))
254 {
255 /* retry on existing query, send to all available servers */
256 domain = forward->sentto->domain;
257 forward->sentto->failed_queries++;
258 if (!option_bool(OPT_ORDER))
259 {
260 forward->forwardall = 1;
261 daemon->last_server = NULL;
262 }
263 type = forward->sentto->flags & SERV_TYPE;
264 if (!(start = forward->sentto->next))
265 start = daemon->servers; /* at end of list, recycle */
266 header->id = htons(forward->new_id);
267 }
268 else
269 {
270 if (gotname)
271 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
272
273 if (!flags && !(forward = get_new_frec(now, NULL)))
274 /* table full - server failure. */
275 flags = F_NEG;
276
277 if (forward)
278 {
279 forward->source = *udpaddr;
280 forward->dest = *dst_addr;
281 forward->iface = dst_iface;
282 forward->orig_id = ntohs(header->id);
283 forward->new_id = get_id(crc);
284 forward->fd = udpfd;
285 forward->crc = crc;
286 forward->forwardall = 0;
287 forward->flags = 0;
288 if (norebind)
289 forward->flags |= FREC_NOREBIND;
290 if (header->hb4 & HB4_CD)
291 forward->flags |= FREC_CHECKING_DISABLED;
292
293 header->id = htons(forward->new_id);
294
295 /* In strict_order mode, always try servers in the order
296 specified in resolv.conf, if a domain is given
297 always try all the available servers,
298 otherwise, use the one last known to work. */
299
300 if (type == 0)
301 {
302 if (option_bool(OPT_ORDER))
303 start = daemon->servers;
304 else if (!(start = daemon->last_server) ||
305 daemon->forwardcount++ > FORWARD_TEST ||
306 difftime(now, daemon->forwardtime) > FORWARD_TIME)
307 {
308 start = daemon->servers;
309 forward->forwardall = 1;
310 daemon->forwardcount = 0;
311 daemon->forwardtime = now;
312 }
313 }
314 else
315 {
316 start = daemon->servers;
317 if (!option_bool(OPT_ORDER))
318 forward->forwardall = 1;
319 }
320 }
321 }
322
323 /* check for send errors here (no route to host)
324 if we fail to send to all nameservers, send back an error
325 packet straight away (helps modem users when offline) */
326
327 if (!flags && forward)
328 {
329 struct server *firstsentto = start;
330 int forwarded = 0;
331
332 if (option_bool(OPT_ADD_MAC))
333 plen = add_mac(header, plen, ((char *) header) + PACKETSZ, &forward->source);
334
335 if (option_bool(OPT_CLIENT_SUBNET))
336 {
337 size_t new = add_source_addr(header, plen, ((char *) header) + PACKETSZ, &forward->source);
338 if (new != plen)
339 {
340 plen = new;
341 forward->flags |= FREC_HAS_SUBNET;
342 }
343 }
344
345 while (1)
346 {
347 /* only send to servers dealing with our domain.
348 domain may be NULL, in which case server->domain
349 must be NULL also. */
350
351 if (type == (start->flags & SERV_TYPE) &&
352 (type != SERV_HAS_DOMAIN || hostname_isequal(domain, start->domain)) &&
353 !(start->flags & SERV_LITERAL_ADDRESS))
354 {
355 int fd;
356
357 /* find server socket to use, may need to get random one. */
358 if (start->sfd)
359 fd = start->sfd->fd;
360 else
361 {
362 #ifdef HAVE_IPV6
363 if (start->addr.sa.sa_family == AF_INET6)
364 {
365 if (!forward->rfd6 &&
366 !(forward->rfd6 = allocate_rfd(AF_INET6)))
367 break;
368 daemon->rfd_save = forward->rfd6;
369 fd = forward->rfd6->fd;
370 }
371 else
372 #endif
373 {
374 if (!forward->rfd4 &&
375 !(forward->rfd4 = allocate_rfd(AF_INET)))
376 break;
377 daemon->rfd_save = forward->rfd4;
378 fd = forward->rfd4->fd;
379 }
380
381 #ifdef HAVE_CONNTRACK
382 /* Copy connection mark of incoming query to outgoing connection. */
383 if (option_bool(OPT_CONNTRACK))
384 {
385 unsigned int mark;
386 if (get_incoming_mark(&forward->source, &forward->dest, 0, &mark))
387 setsockopt(fd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
388 }
389 #endif
390 }
391
392 if (sendto(fd, (char *)header, plen, 0,
393 &start->addr.sa,
394 sa_len(&start->addr)) == -1)
395 {
396 if (retry_send())
397 continue;
398 }
399 else
400 {
401 /* Keep info in case we want to re-send this packet */
402 daemon->srv_save = start;
403 daemon->packet_len = plen;
404
405 if (!gotname)
406 strcpy(daemon->namebuff, "query");
407 if (start->addr.sa.sa_family == AF_INET)
408 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
409 (struct all_addr *)&start->addr.in.sin_addr, NULL);
410 #ifdef HAVE_IPV6
411 else
412 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
413 (struct all_addr *)&start->addr.in6.sin6_addr, NULL);
414 #endif
415 start->queries++;
416 forwarded = 1;
417 forward->sentto = start;
418 if (!forward->forwardall)
419 break;
420 forward->forwardall++;
421 }
422 }
423
424 if (!(start = start->next))
425 start = daemon->servers;
426
427 if (start == firstsentto)
428 break;
429 }
430
431 if (forwarded)
432 return 1;
433
434 /* could not send on, prepare to return */
435 header->id = htons(forward->orig_id);
436 free_frec(forward); /* cancel */
437 }
438
439 /* could not send on, return empty answer or address if known for whole domain */
440 if (udpfd != -1)
441 {
442 plen = setup_reply(header, plen, addrp, flags, daemon->local_ttl);
443 send_from(udpfd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND), (char *)header, plen, udpaddr, dst_addr, dst_iface);
444 }
445
446 return 0;
447 }
448
449 static size_t process_reply(struct dns_header *header, time_t now, struct server *server, size_t n, int check_rebind,
450 int checking_disabled, int check_subnet, union mysockaddr *query_source)
451 {
452 unsigned char *pheader, *sizep;
453 char **sets = 0;
454 int munged = 0, is_sign;
455 size_t plen;
456
457 #ifdef HAVE_IPSET
458 /* Similar algorithm to search_servers. */
459 struct ipsets *ipset_pos;
460 unsigned int namelen = strlen(daemon->namebuff);
461 unsigned int matchlen = 0;
462 for (ipset_pos = daemon->ipsets; ipset_pos; ipset_pos = ipset_pos->next)
463 {
464 unsigned int domainlen = strlen(ipset_pos->domain);
465 char *matchstart = daemon->namebuff + namelen - domainlen;
466 if (namelen >= domainlen && hostname_isequal(matchstart, ipset_pos->domain) &&
467 (domainlen == 0 || namelen == domainlen || *(matchstart - 1) == '.' ) &&
468 domainlen >= matchlen) {
469 matchlen = domainlen;
470 sets = ipset_pos->sets;
471 }
472 }
473 #endif
474
475 /* If upstream is advertising a larger UDP packet size
476 than we allow, trim it so that we don't get overlarge
477 requests for the client. We can't do this for signed packets. */
478
479 if ((pheader = find_pseudoheader(header, n, &plen, &sizep, &is_sign)))
480 {
481 if (!is_sign)
482 {
483 unsigned short udpsz;
484 unsigned char *psave = sizep;
485
486 GETSHORT(udpsz, sizep);
487 if (udpsz > daemon->edns_pktsz)
488 PUTSHORT(daemon->edns_pktsz, psave);
489 }
490
491 if (check_subnet && !check_source(header, plen, pheader, query_source))
492 {
493 my_syslog(LOG_WARNING, _("discarding DNS reply: subnet option mismatch"));
494 return 0;
495 }
496 }
497
498
499 /* RFC 4035 sect 4.6 para 3 */
500 if (!is_sign && !option_bool(OPT_DNSSEC))
501 header->hb4 &= ~HB4_AD;
502
503 if (OPCODE(header) != QUERY || (RCODE(header) != NOERROR && RCODE(header) != NXDOMAIN))
504 return n;
505
506 /* Complain loudly if the upstream server is non-recursive. */
507 if (!(header->hb4 & HB4_RA) && RCODE(header) == NOERROR && ntohs(header->ancount) == 0 &&
508 server && !(server->flags & SERV_WARNED_RECURSIVE))
509 {
510 prettyprint_addr(&server->addr, daemon->namebuff);
511 my_syslog(LOG_WARNING, _("nameserver %s refused to do a recursive query"), daemon->namebuff);
512 if (!option_bool(OPT_LOG))
513 server->flags |= SERV_WARNED_RECURSIVE;
514 }
515
516 if (daemon->bogus_addr && RCODE(header) != NXDOMAIN &&
517 check_for_bogus_wildcard(header, n, daemon->namebuff, daemon->bogus_addr, now))
518 {
519 munged = 1;
520 SET_RCODE(header, NXDOMAIN);
521 header->hb3 &= ~HB3_AA;
522 }
523 else
524 {
525 if (RCODE(header) == NXDOMAIN &&
526 extract_request(header, n, daemon->namebuff, NULL) &&
527 check_for_local_domain(daemon->namebuff, now))
528 {
529 /* if we forwarded a query for a locally known name (because it was for
530 an unknown type) and the answer is NXDOMAIN, convert that to NODATA,
531 since we know that the domain exists, even if upstream doesn't */
532 munged = 1;
533 header->hb3 |= HB3_AA;
534 SET_RCODE(header, NOERROR);
535 }
536
537 if (extract_addresses(header, n, daemon->namebuff, now, sets, is_sign, check_rebind, checking_disabled))
538 {
539 my_syslog(LOG_WARNING, _("possible DNS-rebind attack detected: %s"), daemon->namebuff);
540 munged = 1;
541 }
542 }
543
544 /* do this after extract_addresses. Ensure NODATA reply and remove
545 nameserver info. */
546
547 if (munged)
548 {
549 header->ancount = htons(0);
550 header->nscount = htons(0);
551 header->arcount = htons(0);
552 }
553
554 /* the bogus-nxdomain stuff, doctor and NXDOMAIN->NODATA munging can all elide
555 sections of the packet. Find the new length here and put back pseudoheader
556 if it was removed. */
557 return resize_packet(header, n, pheader, plen);
558 }
559
560 /* sets new last_server */
561 void reply_query(int fd, int family, time_t now)
562 {
563 /* packet from peer server, extract data for cache, and send to
564 original requester */
565 struct dns_header *header;
566 union mysockaddr serveraddr;
567 struct frec *forward;
568 socklen_t addrlen = sizeof(serveraddr);
569 ssize_t n = recvfrom(fd, daemon->packet, daemon->edns_pktsz, 0, &serveraddr.sa, &addrlen);
570 size_t nn;
571 struct server *server;
572
573 /* packet buffer overwritten */
574 daemon->srv_save = NULL;
575
576 /* Determine the address of the server replying so that we can mark that as good */
577 serveraddr.sa.sa_family = family;
578 #ifdef HAVE_IPV6
579 if (serveraddr.sa.sa_family == AF_INET6)
580 serveraddr.in6.sin6_flowinfo = 0;
581 #endif
582
583 /* spoof check: answer must come from known server, */
584 for (server = daemon->servers; server; server = server->next)
585 if (!(server->flags & (SERV_LITERAL_ADDRESS | SERV_NO_ADDR)) &&
586 sockaddr_isequal(&server->addr, &serveraddr))
587 break;
588
589 header = (struct dns_header *)daemon->packet;
590
591 if (!server ||
592 n < (int)sizeof(struct dns_header) || !(header->hb3 & HB3_QR) ||
593 !(forward = lookup_frec(ntohs(header->id), questions_crc(header, n, daemon->namebuff))))
594 return;
595
596 server = forward->sentto;
597
598 if ((RCODE(header) == SERVFAIL || RCODE(header) == REFUSED) &&
599 !option_bool(OPT_ORDER) &&
600 forward->forwardall == 0)
601 /* for broken servers, attempt to send to another one. */
602 {
603 unsigned char *pheader;
604 size_t plen;
605 int is_sign;
606
607 /* recreate query from reply */
608 pheader = find_pseudoheader(header, (size_t)n, &plen, NULL, &is_sign);
609 if (!is_sign)
610 {
611 header->ancount = htons(0);
612 header->nscount = htons(0);
613 header->arcount = htons(0);
614 if ((nn = resize_packet(header, (size_t)n, pheader, plen)))
615 {
616 header->hb3 &= ~(HB3_QR | HB3_TC);
617 forward_query(-1, NULL, NULL, 0, header, nn, now, forward);
618 return;
619 }
620 }
621 }
622
623 if ((forward->sentto->flags & SERV_TYPE) == 0)
624 {
625 if (RCODE(header) == SERVFAIL || RCODE(header) == REFUSED)
626 server = NULL;
627 else
628 {
629 struct server *last_server;
630
631 /* find good server by address if possible, otherwise assume the last one we sent to */
632 for (last_server = daemon->servers; last_server; last_server = last_server->next)
633 if (!(last_server->flags & (SERV_LITERAL_ADDRESS | SERV_HAS_DOMAIN | SERV_FOR_NODOTS | SERV_NO_ADDR)) &&
634 sockaddr_isequal(&last_server->addr, &serveraddr))
635 {
636 server = last_server;
637 break;
638 }
639 }
640 if (!option_bool(OPT_ALL_SERVERS))
641 daemon->last_server = server;
642 }
643
644 /* If the answer is an error, keep the forward record in place in case
645 we get a good reply from another server. Kill it when we've
646 had replies from all to avoid filling the forwarding table when
647 everything is broken */
648 if (forward->forwardall == 0 || --forward->forwardall == 1 ||
649 (RCODE(header) != REFUSED && RCODE(header) != SERVFAIL))
650 {
651 int check_rebind = !(forward->flags & FREC_NOREBIND);
652
653 if (!option_bool(OPT_NO_REBIND))
654 check_rebind = 0;
655
656 if ((nn = process_reply(header, now, server, (size_t)n, check_rebind, forward->flags & FREC_CHECKING_DISABLED,
657 forward->flags & FREC_HAS_SUBNET, &forward->source)))
658 {
659 header->id = htons(forward->orig_id);
660 header->hb4 |= HB4_RA; /* recursion if available */
661 send_from(forward->fd, option_bool(OPT_NOWILD) || option_bool (OPT_CLEVERBIND), daemon->packet, nn,
662 &forward->source, &forward->dest, forward->iface);
663 }
664 free_frec(forward); /* cancel */
665 }
666 }
667
668
669 void receive_query(struct listener *listen, time_t now)
670 {
671 struct dns_header *header = (struct dns_header *)daemon->packet;
672 union mysockaddr source_addr;
673 unsigned short type;
674 struct all_addr dst_addr;
675 struct in_addr netmask, dst_addr_4;
676 size_t m;
677 ssize_t n;
678 int if_index = 0;
679 int local_auth = 0, auth_dns = 0;
680 struct iovec iov[1];
681 struct msghdr msg;
682 struct cmsghdr *cmptr;
683 union {
684 struct cmsghdr align; /* this ensures alignment */
685 #ifdef HAVE_IPV6
686 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
687 #endif
688 #if defined(HAVE_LINUX_NETWORK)
689 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
690 #elif defined(IP_RECVDSTADDR) && defined(HAVE_SOLARIS_NETWORK)
691 char control[CMSG_SPACE(sizeof(struct in_addr)) +
692 CMSG_SPACE(sizeof(unsigned int))];
693 #elif defined(IP_RECVDSTADDR)
694 char control[CMSG_SPACE(sizeof(struct in_addr)) +
695 CMSG_SPACE(sizeof(struct sockaddr_dl))];
696 #endif
697 } control_u;
698
699 /* packet buffer overwritten */
700 daemon->srv_save = NULL;
701
702 dst_addr_4.s_addr = 0;
703 netmask.s_addr = 0;
704
705 if (option_bool(OPT_NOWILD) && listen->iface)
706 {
707 auth_dns = listen->iface->dns_auth;
708
709 if (listen->family == AF_INET)
710 {
711 dst_addr_4 = listen->iface->addr.in.sin_addr;
712 netmask = listen->iface->netmask;
713 }
714 }
715
716 iov[0].iov_base = daemon->packet;
717 iov[0].iov_len = daemon->edns_pktsz;
718
719 msg.msg_control = control_u.control;
720 msg.msg_controllen = sizeof(control_u);
721 msg.msg_flags = 0;
722 msg.msg_name = &source_addr;
723 msg.msg_namelen = sizeof(source_addr);
724 msg.msg_iov = iov;
725 msg.msg_iovlen = 1;
726
727 if ((n = recvmsg(listen->fd, &msg, 0)) == -1)
728 return;
729
730 if (n < (int)sizeof(struct dns_header) ||
731 (msg.msg_flags & MSG_TRUNC) ||
732 (header->hb3 & HB3_QR))
733 return;
734
735 source_addr.sa.sa_family = listen->family;
736 #ifdef HAVE_IPV6
737 if (listen->family == AF_INET6)
738 source_addr.in6.sin6_flowinfo = 0;
739 #endif
740
741 if (!option_bool(OPT_NOWILD))
742 {
743 struct ifreq ifr;
744
745 if (msg.msg_controllen < sizeof(struct cmsghdr))
746 return;
747
748 #if defined(HAVE_LINUX_NETWORK)
749 if (listen->family == AF_INET)
750 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
751 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_PKTINFO)
752 {
753 union {
754 unsigned char *c;
755 struct in_pktinfo *p;
756 } p;
757 p.c = CMSG_DATA(cmptr);
758 dst_addr_4 = dst_addr.addr.addr4 = p.p->ipi_spec_dst;
759 if_index = p.p->ipi_ifindex;
760 }
761 #elif defined(IP_RECVDSTADDR) && defined(IP_RECVIF)
762 if (listen->family == AF_INET)
763 {
764 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
765 {
766 union {
767 unsigned char *c;
768 unsigned int *i;
769 struct in_addr *a;
770 #ifndef HAVE_SOLARIS_NETWORK
771 struct sockaddr_dl *s;
772 #endif
773 } p;
774 p.c = CMSG_DATA(cmptr);
775 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVDSTADDR)
776 dst_addr_4 = dst_addr.addr.addr4 = *(p.a);
777 else if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVIF)
778 #ifdef HAVE_SOLARIS_NETWORK
779 if_index = *(p.i);
780 #else
781 if_index = p.s->sdl_index;
782 #endif
783 }
784 }
785 #endif
786
787 #ifdef HAVE_IPV6
788 if (listen->family == AF_INET6)
789 {
790 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
791 if (cmptr->cmsg_level == IPPROTO_IPV6 && cmptr->cmsg_type == daemon->v6pktinfo)
792 {
793 union {
794 unsigned char *c;
795 struct in6_pktinfo *p;
796 } p;
797 p.c = CMSG_DATA(cmptr);
798
799 dst_addr.addr.addr6 = p.p->ipi6_addr;
800 if_index = p.p->ipi6_ifindex;
801 }
802 }
803 #endif
804
805 /* enforce available interface configuration */
806
807 if (!indextoname(listen->fd, if_index, ifr.ifr_name))
808 return;
809
810 if (!iface_check(listen->family, &dst_addr, ifr.ifr_name, &auth_dns))
811 {
812 if (!option_bool(OPT_CLEVERBIND))
813 enumerate_interfaces(0);
814 if (!loopback_exception(listen->fd, listen->family, &dst_addr, ifr.ifr_name) &&
815 !label_exception(if_index, listen->family, &dst_addr))
816 return;
817 }
818
819 if (listen->family == AF_INET && option_bool(OPT_LOCALISE))
820 {
821 struct irec *iface;
822
823 /* get the netmask of the interface whch has the address we were sent to.
824 This is no neccessarily the interface we arrived on. */
825
826 for (iface = daemon->interfaces; iface; iface = iface->next)
827 if (iface->addr.sa.sa_family == AF_INET &&
828 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
829 break;
830
831 /* interface may be new */
832 if (!iface && !option_bool(OPT_CLEVERBIND))
833 enumerate_interfaces(0);
834
835 for (iface = daemon->interfaces; iface; iface = iface->next)
836 if (iface->addr.sa.sa_family == AF_INET &&
837 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
838 break;
839
840 /* If we failed, abandon localisation */
841 if (iface)
842 netmask = iface->netmask;
843 else
844 dst_addr_4.s_addr = 0;
845 }
846 }
847
848 if (extract_request(header, (size_t)n, daemon->namebuff, &type))
849 {
850 char types[20];
851 #ifdef HAVE_AUTH
852 struct auth_zone *zone;
853 #endif
854
855 querystr(auth_dns ? "auth" : "query", types, type);
856
857 if (listen->family == AF_INET)
858 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
859 (struct all_addr *)&source_addr.in.sin_addr, types);
860 #ifdef HAVE_IPV6
861 else
862 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
863 (struct all_addr *)&source_addr.in6.sin6_addr, types);
864 #endif
865
866 #ifdef HAVE_AUTH
867 /* find queries for zones we're authoritative for, and answer them directly */
868 for (zone = daemon->auth_zones; zone; zone = zone->next)
869 if (in_zone(zone, daemon->namebuff, NULL))
870 {
871 auth_dns = 1;
872 local_auth = 1;
873 break;
874 }
875 #endif
876 }
877
878 #ifdef HAVE_AUTH
879 if (auth_dns)
880 {
881 m = answer_auth(header, ((char *) header) + PACKETSZ, (size_t)n, now, &source_addr, local_auth);
882 if (m >= 1)
883 {
884 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
885 (char *)header, m, &source_addr, &dst_addr, if_index);
886 daemon->auth_answer++;
887 }
888 }
889 else
890 #endif
891 {
892 m = answer_request(header, ((char *) header) + PACKETSZ, (size_t)n,
893 dst_addr_4, netmask, now);
894
895 if (m >= 1)
896 {
897 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
898 (char *)header, m, &source_addr, &dst_addr, if_index);
899 daemon->local_answer++;
900 }
901 else if (forward_query(listen->fd, &source_addr, &dst_addr, if_index,
902 header, (size_t)n, now, NULL))
903 daemon->queries_forwarded++;
904 else
905 daemon->local_answer++;
906 }
907 }
908
909 /* The daemon forks before calling this: it should deal with one connection,
910 blocking as necessary, and then return. Note, need to be a bit careful
911 about resources for debug mode, when the fork is suppressed: that's
912 done by the caller. */
913 unsigned char *tcp_request(int confd, time_t now,
914 union mysockaddr *local_addr, struct in_addr netmask, int auth_dns)
915 {
916 size_t size = 0;
917 int norebind = 0;
918 int local_auth = 0;
919 int checking_disabled, check_subnet;
920 size_t m;
921 unsigned short qtype;
922 unsigned int gotname;
923 unsigned char c1, c2;
924 /* Max TCP packet + slop + size */
925 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
926 unsigned char *payload = &packet[2];
927 /* largest field in header is 16-bits, so this is still sufficiently aligned */
928 struct dns_header *header = (struct dns_header *)payload;
929 u16 *length = (u16 *)packet;
930 struct server *last_server;
931 struct in_addr dst_addr_4;
932 union mysockaddr peer_addr;
933 socklen_t peer_len = sizeof(union mysockaddr);
934
935 if (getpeername(confd, (struct sockaddr *)&peer_addr, &peer_len) == -1)
936 return packet;
937
938 while (1)
939 {
940 if (!packet ||
941 !read_write(confd, &c1, 1, 1) || !read_write(confd, &c2, 1, 1) ||
942 !(size = c1 << 8 | c2) ||
943 !read_write(confd, payload, size, 1))
944 return packet;
945
946 if (size < (int)sizeof(struct dns_header))
947 continue;
948
949 check_subnet = 0;
950
951 /* save state of "cd" flag in query */
952 checking_disabled = header->hb4 & HB4_CD;
953
954 /* RFC 4035: sect 4.6 para 2 */
955 header->hb4 &= ~HB4_AD;
956
957 if ((gotname = extract_request(header, (unsigned int)size, daemon->namebuff, &qtype)))
958 {
959 char types[20];
960 #ifdef HAVE_AUTH
961 struct auth_zone *zone;
962 #endif
963 querystr(auth_dns ? "auth" : "query", types, qtype);
964
965 if (peer_addr.sa.sa_family == AF_INET)
966 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
967 (struct all_addr *)&peer_addr.in.sin_addr, types);
968 #ifdef HAVE_IPV6
969 else
970 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
971 (struct all_addr *)&peer_addr.in6.sin6_addr, types);
972 #endif
973
974 #ifdef HAVE_AUTH
975 /* find queries for zones we're authoritative for, and answer them directly */
976 for (zone = daemon->auth_zones; zone; zone = zone->next)
977 if (in_zone(zone, daemon->namebuff, NULL))
978 {
979 auth_dns = 1;
980 local_auth = 1;
981 break;
982 }
983 #endif
984 }
985
986 if (local_addr->sa.sa_family == AF_INET)
987 dst_addr_4 = local_addr->in.sin_addr;
988 else
989 dst_addr_4.s_addr = 0;
990
991 #ifdef HAVE_AUTH
992 if (auth_dns)
993 m = answer_auth(header, ((char *) header) + 65536, (size_t)size, now, &peer_addr, local_auth);
994 else
995 #endif
996 {
997 /* m > 0 if answered from cache */
998 m = answer_request(header, ((char *) header) + 65536, (size_t)size,
999 dst_addr_4, netmask, now);
1000
1001 /* Do this by steam now we're not in the select() loop */
1002 check_log_writer(NULL);
1003
1004 if (m == 0)
1005 {
1006 unsigned int flags = 0;
1007 struct all_addr *addrp = NULL;
1008 int type = 0;
1009 char *domain = NULL;
1010
1011 if (option_bool(OPT_ADD_MAC))
1012 size = add_mac(header, size, ((char *) header) + 65536, &peer_addr);
1013
1014 if (option_bool(OPT_CLIENT_SUBNET))
1015 {
1016 size_t new = add_source_addr(header, size, ((char *) header) + 65536, &peer_addr);
1017 if (size != new)
1018 {
1019 size = new;
1020 check_subnet = 1;
1021 }
1022 }
1023
1024 if (gotname)
1025 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
1026
1027 if (type != 0 || option_bool(OPT_ORDER) || !daemon->last_server)
1028 last_server = daemon->servers;
1029 else
1030 last_server = daemon->last_server;
1031
1032 if (!flags && last_server)
1033 {
1034 struct server *firstsendto = NULL;
1035 unsigned int crc = questions_crc(header, (unsigned int)size, daemon->namebuff);
1036
1037 /* Loop round available servers until we succeed in connecting to one.
1038 Note that this code subtley ensures that consecutive queries on this connection
1039 which can go to the same server, do so. */
1040 while (1)
1041 {
1042 if (!firstsendto)
1043 firstsendto = last_server;
1044 else
1045 {
1046 if (!(last_server = last_server->next))
1047 last_server = daemon->servers;
1048
1049 if (last_server == firstsendto)
1050 break;
1051 }
1052
1053 /* server for wrong domain */
1054 if (type != (last_server->flags & SERV_TYPE) ||
1055 (type == SERV_HAS_DOMAIN && !hostname_isequal(domain, last_server->domain)))
1056 continue;
1057
1058 if (last_server->tcpfd == -1)
1059 {
1060 if ((last_server->tcpfd = socket(last_server->addr.sa.sa_family, SOCK_STREAM, 0)) == -1)
1061 continue;
1062
1063 if ((!local_bind(last_server->tcpfd, &last_server->source_addr, last_server->interface, 1) ||
1064 connect(last_server->tcpfd, &last_server->addr.sa, sa_len(&last_server->addr)) == -1))
1065 {
1066 close(last_server->tcpfd);
1067 last_server->tcpfd = -1;
1068 continue;
1069 }
1070
1071 #ifdef HAVE_CONNTRACK
1072 /* Copy connection mark of incoming query to outgoing connection. */
1073 if (option_bool(OPT_CONNTRACK))
1074 {
1075 unsigned int mark;
1076 struct all_addr local;
1077 #ifdef HAVE_IPV6
1078 if (local_addr->sa.sa_family == AF_INET6)
1079 local.addr.addr6 = local_addr->in6.sin6_addr;
1080 else
1081 #endif
1082 local.addr.addr4 = local_addr->in.sin_addr;
1083
1084 if (get_incoming_mark(&peer_addr, &local, 1, &mark))
1085 setsockopt(last_server->tcpfd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
1086 }
1087 #endif
1088 }
1089
1090 *length = htons(size);
1091
1092 if (!read_write(last_server->tcpfd, packet, size + sizeof(u16), 0) ||
1093 !read_write(last_server->tcpfd, &c1, 1, 1) ||
1094 !read_write(last_server->tcpfd, &c2, 1, 1))
1095 {
1096 close(last_server->tcpfd);
1097 last_server->tcpfd = -1;
1098 continue;
1099 }
1100
1101 m = (c1 << 8) | c2;
1102 if (!read_write(last_server->tcpfd, payload, m, 1))
1103 return packet;
1104
1105 if (!gotname)
1106 strcpy(daemon->namebuff, "query");
1107 if (last_server->addr.sa.sa_family == AF_INET)
1108 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1109 (struct all_addr *)&last_server->addr.in.sin_addr, NULL);
1110 #ifdef HAVE_IPV6
1111 else
1112 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1113 (struct all_addr *)&last_server->addr.in6.sin6_addr, NULL);
1114 #endif
1115
1116 /* There's no point in updating the cache, since this process will exit and
1117 lose the information after a few queries. We make this call for the alias and
1118 bogus-nxdomain side-effects. */
1119 /* If the crc of the question section doesn't match the crc we sent, then
1120 someone might be attempting to insert bogus values into the cache by
1121 sending replies containing questions and bogus answers. */
1122 if (crc == questions_crc(header, (unsigned int)m, daemon->namebuff))
1123 m = process_reply(header, now, last_server, (unsigned int)m,
1124 option_bool(OPT_NO_REBIND) && !norebind, checking_disabled,
1125 check_subnet, &peer_addr);
1126
1127 break;
1128 }
1129 }
1130
1131 /* In case of local answer or no connections made. */
1132 if (m == 0)
1133 m = setup_reply(header, (unsigned int)size, addrp, flags, daemon->local_ttl);
1134 }
1135 }
1136
1137 check_log_writer(NULL);
1138
1139 *length = htons(m);
1140
1141 if (m == 0 || !read_write(confd, packet, m + sizeof(u16), 0))
1142 return packet;
1143 }
1144 }
1145
1146 static struct frec *allocate_frec(time_t now)
1147 {
1148 struct frec *f;
1149
1150 if ((f = (struct frec *)whine_malloc(sizeof(struct frec))))
1151 {
1152 f->next = daemon->frec_list;
1153 f->time = now;
1154 f->sentto = NULL;
1155 f->rfd4 = NULL;
1156 f->flags = 0;
1157 #ifdef HAVE_IPV6
1158 f->rfd6 = NULL;
1159 #endif
1160 daemon->frec_list = f;
1161 }
1162
1163 return f;
1164 }
1165
1166 static struct randfd *allocate_rfd(int family)
1167 {
1168 static int finger = 0;
1169 int i;
1170
1171 /* limit the number of sockets we have open to avoid starvation of
1172 (eg) TFTP. Once we have a reasonable number, randomness should be OK */
1173
1174 for (i = 0; i < RANDOM_SOCKS; i++)
1175 if (daemon->randomsocks[i].refcount == 0)
1176 {
1177 if ((daemon->randomsocks[i].fd = random_sock(family)) == -1)
1178 break;
1179
1180 daemon->randomsocks[i].refcount = 1;
1181 daemon->randomsocks[i].family = family;
1182 return &daemon->randomsocks[i];
1183 }
1184
1185 /* No free ones or cannot get new socket, grab an existing one */
1186 for (i = 0; i < RANDOM_SOCKS; i++)
1187 {
1188 int j = (i+finger) % RANDOM_SOCKS;
1189 if (daemon->randomsocks[j].refcount != 0 &&
1190 daemon->randomsocks[j].family == family &&
1191 daemon->randomsocks[j].refcount != 0xffff)
1192 {
1193 finger = j;
1194 daemon->randomsocks[j].refcount++;
1195 return &daemon->randomsocks[j];
1196 }
1197 }
1198
1199 return NULL; /* doom */
1200 }
1201
1202 static void free_frec(struct frec *f)
1203 {
1204 if (f->rfd4 && --(f->rfd4->refcount) == 0)
1205 close(f->rfd4->fd);
1206
1207 f->rfd4 = NULL;
1208 f->sentto = NULL;
1209 f->flags = 0;
1210
1211 #ifdef HAVE_IPV6
1212 if (f->rfd6 && --(f->rfd6->refcount) == 0)
1213 close(f->rfd6->fd);
1214
1215 f->rfd6 = NULL;
1216 #endif
1217 }
1218
1219 /* if wait==NULL return a free or older than TIMEOUT record.
1220 else return *wait zero if one available, or *wait is delay to
1221 when the oldest in-use record will expire. Impose an absolute
1222 limit of 4*TIMEOUT before we wipe things (for random sockets) */
1223 struct frec *get_new_frec(time_t now, int *wait)
1224 {
1225 struct frec *f, *oldest, *target;
1226 int count;
1227
1228 if (wait)
1229 *wait = 0;
1230
1231 for (f = daemon->frec_list, oldest = NULL, target = NULL, count = 0; f; f = f->next, count++)
1232 if (!f->sentto)
1233 target = f;
1234 else
1235 {
1236 if (difftime(now, f->time) >= 4*TIMEOUT)
1237 {
1238 free_frec(f);
1239 target = f;
1240 }
1241
1242 if (!oldest || difftime(f->time, oldest->time) <= 0)
1243 oldest = f;
1244 }
1245
1246 if (target)
1247 {
1248 target->time = now;
1249 return target;
1250 }
1251
1252 /* can't find empty one, use oldest if there is one
1253 and it's older than timeout */
1254 if (oldest && ((int)difftime(now, oldest->time)) >= TIMEOUT)
1255 {
1256 /* keep stuff for twice timeout if we can by allocating a new
1257 record instead */
1258 if (difftime(now, oldest->time) < 2*TIMEOUT &&
1259 count <= daemon->ftabsize &&
1260 (f = allocate_frec(now)))
1261 return f;
1262
1263 if (!wait)
1264 {
1265 free_frec(oldest);
1266 oldest->time = now;
1267 }
1268 return oldest;
1269 }
1270
1271 /* none available, calculate time 'till oldest record expires */
1272 if (count > daemon->ftabsize)
1273 {
1274 static time_t last_log = 0;
1275
1276 if (oldest && wait)
1277 *wait = oldest->time + (time_t)TIMEOUT - now;
1278
1279 if ((int)difftime(now, last_log) > 5)
1280 {
1281 last_log = now;
1282 my_syslog(LOG_WARNING, _("Maximum number of concurrent DNS queries reached (max: %d)"), daemon->ftabsize);
1283 }
1284
1285 return NULL;
1286 }
1287
1288 if (!(f = allocate_frec(now)) && wait)
1289 /* wait one second on malloc failure */
1290 *wait = 1;
1291
1292 return f; /* OK if malloc fails and this is NULL */
1293 }
1294
1295 /* crc is all-ones if not known. */
1296 static struct frec *lookup_frec(unsigned short id, unsigned int crc)
1297 {
1298 struct frec *f;
1299
1300 for(f = daemon->frec_list; f; f = f->next)
1301 if (f->sentto && f->new_id == id &&
1302 (f->crc == crc || crc == 0xffffffff))
1303 return f;
1304
1305 return NULL;
1306 }
1307
1308 static struct frec *lookup_frec_by_sender(unsigned short id,
1309 union mysockaddr *addr,
1310 unsigned int crc)
1311 {
1312 struct frec *f;
1313
1314 for(f = daemon->frec_list; f; f = f->next)
1315 if (f->sentto &&
1316 f->orig_id == id &&
1317 f->crc == crc &&
1318 sockaddr_isequal(&f->source, addr))
1319 return f;
1320
1321 return NULL;
1322 }
1323
1324 /* A server record is going away, remove references to it */
1325 void server_gone(struct server *server)
1326 {
1327 struct frec *f;
1328
1329 for (f = daemon->frec_list; f; f = f->next)
1330 if (f->sentto && f->sentto == server)
1331 free_frec(f);
1332
1333 if (daemon->last_server == server)
1334 daemon->last_server = NULL;
1335
1336 if (daemon->srv_save == server)
1337 daemon->srv_save = NULL;
1338 }
1339
/* Return a random id that is not in use: values from rand16() are drawn
   until lookup_frec() finds no record for that id and crc. */
static unsigned short get_id(unsigned int crc)
{
  unsigned short candidate;

  for (;;)
    {
      candidate = rand16();

      if (!lookup_frec(candidate, crc))
        return candidate;
    }
}
1351
1352
1353
1354
1355