]> git.ipfire.org Git - people/ms/dnsmasq.git/blame - src/forward.c
Only set scope_id in addresses to bind() for linklocal addresses.
[people/ms/dnsmasq.git] / src / forward.c
CommitLineData
/* dnsmasq is Copyright (c) 2000-2013 Simon Kelley

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; version 2 dated June, 1991, or
   (at your option) version 3 dated 29 June, 2007.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program.  If not, see <http://www.gnu.org/licenses/>.
*/
16
9e4abcb5
SK
17#include "dnsmasq.h"
18
/* Forward declarations of file-local (static) helpers that are used by the
   functions below before their definitions appear. */
static struct frec *lookup_frec(unsigned short id, unsigned int crc);
static struct frec *lookup_frec_by_sender(unsigned short id,
                                          union mysockaddr *addr,
                                          unsigned int crc);
static unsigned short get_id(unsigned int crc);
static void free_frec(struct frec *f);
static struct randfd *allocate_rfd(int family);
9e4abcb5 26
824af85b 27/* Send a UDP packet with its source address set as "source"
44a2a316 28 unless nowild is true, when we just send it with the kernel default */
29689cfa
SK
29int send_from(int fd, int nowild, char *packet, size_t len,
30 union mysockaddr *to, struct all_addr *source,
50303b19 31 unsigned int iface)
9e4abcb5 32{
44a2a316
SK
33 struct msghdr msg;
34 struct iovec iov[1];
44a2a316
SK
35 union {
36 struct cmsghdr align; /* this ensures alignment */
5e9e0efb 37#if defined(HAVE_LINUX_NETWORK)
44a2a316
SK
38 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
39#elif defined(IP_SENDSRCADDR)
40 char control[CMSG_SPACE(sizeof(struct in_addr))];
41#endif
42#ifdef HAVE_IPV6
43 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
44#endif
45 } control_u;
feba5c1d 46
44a2a316
SK
47 iov[0].iov_base = packet;
48 iov[0].iov_len = len;
49
feba5c1d
SK
50 msg.msg_control = NULL;
51 msg.msg_controllen = 0;
44a2a316
SK
52 msg.msg_flags = 0;
53 msg.msg_name = to;
54 msg.msg_namelen = sa_len(to);
55 msg.msg_iov = iov;
56 msg.msg_iovlen = 1;
feba5c1d 57
26128d27 58 if (!nowild)
44a2a316 59 {
26128d27 60 struct cmsghdr *cmptr;
feba5c1d
SK
61 msg.msg_control = &control_u;
62 msg.msg_controllen = sizeof(control_u);
26128d27
SK
63 cmptr = CMSG_FIRSTHDR(&msg);
64
65 if (to->sa.sa_family == AF_INET)
66 {
5e9e0efb 67#if defined(HAVE_LINUX_NETWORK)
8ef5ada2
SK
68 struct in_pktinfo p;
69 p.ipi_ifindex = 0;
70 p.ipi_spec_dst = source->addr.addr4;
71 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
26128d27 72 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_pktinfo));
c72daea8 73 cmptr->cmsg_level = IPPROTO_IP;
26128d27 74 cmptr->cmsg_type = IP_PKTINFO;
44a2a316 75#elif defined(IP_SENDSRCADDR)
8ef5ada2 76 memcpy(CMSG_DATA(cmptr), &(source->addr.addr4), sizeof(source->addr.addr4));
26128d27
SK
77 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in_addr));
78 cmptr->cmsg_level = IPPROTO_IP;
79 cmptr->cmsg_type = IP_SENDSRCADDR;
44a2a316 80#endif
26128d27 81 }
26128d27 82 else
b8187c80 83#ifdef HAVE_IPV6
26128d27 84 {
8ef5ada2
SK
85 struct in6_pktinfo p;
86 p.ipi6_ifindex = iface; /* Need iface for IPv6 to handle link-local addrs */
87 p.ipi6_addr = source->addr.addr6;
88 memcpy(CMSG_DATA(cmptr), &p, sizeof(p));
26128d27 89 msg.msg_controllen = cmptr->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
316e2730 90 cmptr->cmsg_type = daemon->v6pktinfo;
c72daea8 91 cmptr->cmsg_level = IPPROTO_IPV6;
26128d27 92 }
3d8df260 93#else
c72daea8 94 (void)iface; /* eliminate warning */
44a2a316 95#endif
26128d27 96 }
feba5c1d 97
29d28dda 98 while (sendmsg(fd, &msg, 0) == -1)
feba5c1d 99 {
fd9fa481 100 if (retry_send())
29d28dda 101 continue;
22d904db 102
29d28dda
SK
103 /* If interface is still in DAD, EINVAL results - ignore that. */
104 if (errno == EINVAL)
105 break;
29689cfa 106
29d28dda 107 my_syslog(LOG_ERR, _("failed to send packet: %s"), strerror(errno));
29689cfa 108 return 0;
feba5c1d 109 }
29d28dda 110
29689cfa 111 return 1;
9e4abcb5 112}
44a2a316 113
28866e95
SK
114static unsigned int search_servers(time_t now, struct all_addr **addrpp,
115 unsigned int qtype, char *qdomain, int *type, char **domain, int *norebind)
feba5c1d
SK
116
117{
118 /* If the query ends in the domain in one of our servers, set
119 domain to point to that name. We find the largest match to allow both
120 domain.org and sub.domain.org to exist. */
121
122 unsigned int namelen = strlen(qdomain);
123 unsigned int matchlen = 0;
124 struct server *serv;
28866e95 125 unsigned int flags = 0;
feba5c1d 126
3be34541 127 for (serv = daemon->servers; serv; serv=serv->next)
feba5c1d 128 /* domain matches take priority over NODOTS matches */
3d8df260 129 if ((serv->flags & SERV_FOR_NODOTS) && *type != SERV_HAS_DOMAIN && !strchr(qdomain, '.') && namelen != 0)
feba5c1d 130 {
28866e95 131 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
feba5c1d 132 *type = SERV_FOR_NODOTS;
feba5c1d 133 if (serv->flags & SERV_NO_ADDR)
36717eee
SK
134 flags = F_NXDOMAIN;
135 else if (serv->flags & SERV_LITERAL_ADDRESS)
136 {
137 if (sflag & qtype)
138 {
139 flags = sflag;
140 if (serv->addr.sa.sa_family == AF_INET)
141 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
feba5c1d 142#ifdef HAVE_IPV6
36717eee
SK
143 else
144 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
feba5c1d 145#endif
36717eee 146 }
824af85b 147 else if (!flags || (flags & F_NXDOMAIN))
36717eee
SK
148 flags = F_NOERR;
149 }
feba5c1d
SK
150 }
151 else if (serv->flags & SERV_HAS_DOMAIN)
152 {
153 unsigned int domainlen = strlen(serv->domain);
b8187c80 154 char *matchstart = qdomain + namelen - domainlen;
feba5c1d 155 if (namelen >= domainlen &&
b8187c80 156 hostname_isequal(matchstart, serv->domain) &&
8ef5ada2 157 (domainlen == 0 || namelen == domainlen || *(matchstart-1) == '.' ))
feba5c1d 158 {
8ef5ada2
SK
159 if (serv->flags & SERV_NO_REBIND)
160 *norebind = 1;
28866e95 161 else
feba5c1d 162 {
28866e95
SK
163 unsigned int sflag = serv->addr.sa.sa_family == AF_INET ? F_IPV4 : F_IPV6;
164 /* implement priority rules for --address and --server for same domain.
165 --address wins if the address is for the correct AF
166 --server wins otherwise. */
167 if (domainlen != 0 && domainlen == matchlen)
36717eee 168 {
28866e95 169 if ((serv->flags & SERV_LITERAL_ADDRESS))
8ef5ada2 170 {
28866e95
SK
171 if (!(sflag & qtype) && flags == 0)
172 continue;
173 }
174 else
175 {
176 if (flags & (F_IPV4 | F_IPV6))
177 continue;
178 }
179 }
180
181 if (domainlen >= matchlen)
182 {
183 *type = serv->flags & (SERV_HAS_DOMAIN | SERV_USE_RESOLV | SERV_NO_REBIND);
184 *domain = serv->domain;
185 matchlen = domainlen;
186 if (serv->flags & SERV_NO_ADDR)
187 flags = F_NXDOMAIN;
188 else if (serv->flags & SERV_LITERAL_ADDRESS)
189 {
190 if (sflag & qtype)
191 {
192 flags = sflag;
193 if (serv->addr.sa.sa_family == AF_INET)
194 *addrpp = (struct all_addr *)&serv->addr.in.sin_addr;
feba5c1d 195#ifdef HAVE_IPV6
28866e95
SK
196 else
197 *addrpp = (struct all_addr *)&serv->addr.in6.sin6_addr;
feba5c1d 198#endif
28866e95
SK
199 }
200 else if (!flags || (flags & F_NXDOMAIN))
201 flags = F_NOERR;
8ef5ada2 202 }
28866e95
SK
203 else
204 flags = 0;
205 }
206 }
8ef5ada2 207 }
feba5c1d 208 }
8ef5ada2 209
7de060b0 210 if (flags == 0 && !(qtype & F_QUERY) &&
28866e95 211 option_bool(OPT_NODOTS_LOCAL) && !strchr(qdomain, '.') && namelen != 0)
7de060b0
SK
212 /* don't forward A or AAAA queries for simple names, except the empty name */
213 flags = F_NOERR;
8ef5ada2 214
5aabfc78 215 if (flags == F_NXDOMAIN && check_for_local_domain(qdomain, now))
c1bb8504 216 flags = F_NOERR;
feba5c1d 217
824af85b
SK
218 if (flags)
219 {
220 int logflags = 0;
221
222 if (flags == F_NXDOMAIN || flags == F_NOERR)
223 logflags = F_NEG | qtype;
224
1a6bca81 225 log_query(logflags | flags | F_CONFIG | F_FORWARD, qdomain, *addrpp, NULL);
824af85b 226 }
8ef5ada2
SK
227 else if ((*type) & SERV_USE_RESOLV)
228 {
229 *type = 0; /* use normal servers for this domain */
230 *domain = NULL;
231 }
feba5c1d
SK
232 return flags;
233}
44a2a316 234
824af85b
SK
235static int forward_query(int udpfd, union mysockaddr *udpaddr,
236 struct all_addr *dst_addr, unsigned int dst_iface,
572b41eb 237 struct dns_header *header, size_t plen, time_t now, struct frec *forward)
9e4abcb5 238{
9e4abcb5 239 char *domain = NULL;
8ef5ada2 240 int type = 0, norebind = 0;
9e4abcb5 241 struct all_addr *addrp = NULL;
cdeda28f 242 unsigned int crc = questions_crc(header, plen, daemon->namebuff);
28866e95
SK
243 unsigned int flags = 0;
244 unsigned int gotname = extract_request(header, plen, daemon->namebuff, NULL);
de37951c 245 struct server *start = NULL;
7de060b0 246
28866e95 247 /* RFC 4035: sect 4.6 para 2 */
572b41eb
SK
248 header->hb4 &= ~HB4_AD;
249
3d8df260
SK
250 /* may be no servers available. */
251 if (!daemon->servers)
9e4abcb5 252 forward = NULL;
b8187c80 253 else if (forward || (forward = lookup_frec_by_sender(ntohs(header->id), udpaddr, crc)))
9e4abcb5 254 {
de37951c 255 /* retry on existing query, send to all available servers */
9e4abcb5 256 domain = forward->sentto->domain;
824af85b 257 forward->sentto->failed_queries++;
28866e95 258 if (!option_bool(OPT_ORDER))
de37951c 259 {
0a852541 260 forward->forwardall = 1;
3be34541 261 daemon->last_server = NULL;
de37951c 262 }
9e4abcb5 263 type = forward->sentto->flags & SERV_TYPE;
de37951c 264 if (!(start = forward->sentto->next))
3be34541 265 start = daemon->servers; /* at end of list, recycle */
9e4abcb5
SK
266 header->id = htons(forward->new_id);
267 }
268 else
269 {
270 if (gotname)
8ef5ada2 271 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
9e4abcb5 272
5aabfc78 273 if (!flags && !(forward = get_new_frec(now, NULL)))
feba5c1d
SK
274 /* table full - server failure. */
275 flags = F_NEG;
9e4abcb5
SK
276
277 if (forward)
278 {
0a852541
SK
279 forward->source = *udpaddr;
280 forward->dest = *dst_addr;
281 forward->iface = dst_iface;
0a852541 282 forward->orig_id = ntohs(header->id);
316e2730 283 forward->new_id = get_id(crc);
832af0ba 284 forward->fd = udpfd;
0a852541
SK
285 forward->crc = crc;
286 forward->forwardall = 0;
ed4c0767 287 forward->flags = 0;
28866e95
SK
288 if (norebind)
289 forward->flags |= FREC_NOREBIND;
572b41eb 290 if (header->hb4 & HB4_CD)
28866e95 291 forward->flags |= FREC_CHECKING_DISABLED;
0a852541 292
28866e95
SK
293 header->id = htons(forward->new_id);
294
8ef5ada2
SK
295 /* In strict_order mode, always try servers in the order
296 specified in resolv.conf, if a domain is given
297 always try all the available servers,
9e4abcb5
SK
298 otherwise, use the one last known to work. */
299
8ef5ada2
SK
300 if (type == 0)
301 {
28866e95 302 if (option_bool(OPT_ORDER))
8ef5ada2
SK
303 start = daemon->servers;
304 else if (!(start = daemon->last_server) ||
305 daemon->forwardcount++ > FORWARD_TEST ||
306 difftime(now, daemon->forwardtime) > FORWARD_TIME)
307 {
308 start = daemon->servers;
309 forward->forwardall = 1;
310 daemon->forwardcount = 0;
311 daemon->forwardtime = now;
312 }
313 }
314 else
de37951c 315 {
3be34541 316 start = daemon->servers;
28866e95 317 if (!option_bool(OPT_ORDER))
8ef5ada2 318 forward->forwardall = 1;
de37951c 319 }
9e4abcb5
SK
320 }
321 }
feba5c1d 322
9e4abcb5
SK
323 /* check for send errors here (no route to host)
324 if we fail to send to all nameservers, send back an error
325 packet straight away (helps modem users when offline) */
326
327 if (!flags && forward)
328 {
de37951c
SK
329 struct server *firstsentto = start;
330 int forwarded = 0;
28866e95 331
797a7afb
GT
332 if (option_bool(OPT_ADD_MAC))
333 plen = add_mac(header, plen, ((char *) header) + PACKETSZ, &forward->source);
28866e95 334
ed4c0767
SK
335 if (option_bool(OPT_CLIENT_SUBNET))
336 {
337 size_t new = add_source_addr(header, plen, ((char *) header) + PACKETSZ, &forward->source);
338 if (new != plen)
339 {
340 plen = new;
341 forward->flags |= FREC_HAS_SUBNET;
342 }
343 }
344
9e4abcb5
SK
345 while (1)
346 {
9e4abcb5
SK
347 /* only send to servers dealing with our domain.
348 domain may be NULL, in which case server->domain
349 must be NULL also. */
350
de37951c 351 if (type == (start->flags & SERV_TYPE) &&
fd9fa481
SK
352 (type != SERV_HAS_DOMAIN || hostname_isequal(domain, start->domain)) &&
353 !(start->flags & SERV_LITERAL_ADDRESS))
9e4abcb5 354 {
1a6bca81
SK
355 int fd;
356
357 /* find server socket to use, may need to get random one. */
358 if (start->sfd)
359 fd = start->sfd->fd;
360 else
361 {
362#ifdef HAVE_IPV6
363 if (start->addr.sa.sa_family == AF_INET6)
364 {
365 if (!forward->rfd6 &&
366 !(forward->rfd6 = allocate_rfd(AF_INET6)))
367 break;
3927da46 368 daemon->rfd_save = forward->rfd6;
1a6bca81
SK
369 fd = forward->rfd6->fd;
370 }
371 else
372#endif
373 {
374 if (!forward->rfd4 &&
375 !(forward->rfd4 = allocate_rfd(AF_INET)))
376 break;
3927da46 377 daemon->rfd_save = forward->rfd4;
1a6bca81
SK
378 fd = forward->rfd4->fd;
379 }
7de060b0
SK
380
381#ifdef HAVE_CONNTRACK
382 /* Copy connection mark of incoming query to outgoing connection. */
383 if (option_bool(OPT_CONNTRACK))
384 {
385 unsigned int mark;
797a7afb 386 if (get_incoming_mark(&forward->source, &forward->dest, 0, &mark))
7de060b0
SK
387 setsockopt(fd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
388 }
389#endif
1a6bca81
SK
390 }
391
392 if (sendto(fd, (char *)header, plen, 0,
feba5c1d 393 &start->addr.sa,
fd9fa481
SK
394 sa_len(&start->addr)) == -1)
395 {
396 if (retry_send())
397 continue;
398 }
399 else
9e4abcb5 400 {
cdeda28f
SK
401 /* Keep info in case we want to re-send this packet */
402 daemon->srv_save = start;
403 daemon->packet_len = plen;
404
de37951c 405 if (!gotname)
3be34541 406 strcpy(daemon->namebuff, "query");
de37951c 407 if (start->addr.sa.sa_family == AF_INET)
3be34541 408 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1a6bca81 409 (struct all_addr *)&start->addr.in.sin_addr, NULL);
de37951c
SK
410#ifdef HAVE_IPV6
411 else
3be34541 412 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1a6bca81 413 (struct all_addr *)&start->addr.in6.sin6_addr, NULL);
de37951c 414#endif
824af85b 415 start->queries++;
de37951c
SK
416 forwarded = 1;
417 forward->sentto = start;
0a852541 418 if (!forward->forwardall)
de37951c 419 break;
0a852541 420 forward->forwardall++;
9e4abcb5
SK
421 }
422 }
423
de37951c 424 if (!(start = start->next))
3be34541 425 start = daemon->servers;
9e4abcb5 426
de37951c 427 if (start == firstsentto)
9e4abcb5
SK
428 break;
429 }
430
de37951c 431 if (forwarded)
824af85b 432 return 1;
de37951c 433
9e4abcb5
SK
434 /* could not send on, prepare to return */
435 header->id = htons(forward->orig_id);
1a6bca81 436 free_frec(forward); /* cancel */
9e4abcb5
SK
437 }
438
439 /* could not send on, return empty answer or address if known for whole domain */
b8187c80
SK
440 if (udpfd != -1)
441 {
cdeda28f 442 plen = setup_reply(header, plen, addrp, flags, daemon->local_ttl);
54dd393f 443 send_from(udpfd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND), (char *)header, plen, udpaddr, dst_addr, dst_iface);
b8187c80
SK
444 }
445
824af85b 446 return 0;
9e4abcb5
SK
447}
448
ed4c0767
SK
449static size_t process_reply(struct dns_header *header, time_t now, struct server *server, size_t n, int check_rebind,
450 int checking_disabled, int check_subnet, union mysockaddr *query_source)
feba5c1d 451{
36717eee 452 unsigned char *pheader, *sizep;
13d86c73 453 char **sets = 0;
832af0ba 454 int munged = 0, is_sign;
cdeda28f
SK
455 size_t plen;
456
13d86c73
JD
457#ifdef HAVE_IPSET
458 /* Similar algorithm to search_servers. */
459 struct ipsets *ipset_pos;
460 unsigned int namelen = strlen(daemon->namebuff);
461 unsigned int matchlen = 0;
462 for (ipset_pos = daemon->ipsets; ipset_pos; ipset_pos = ipset_pos->next)
463 {
464 unsigned int domainlen = strlen(ipset_pos->domain);
465 char *matchstart = daemon->namebuff + namelen - domainlen;
466 if (namelen >= domainlen && hostname_isequal(matchstart, ipset_pos->domain) &&
467 (domainlen == 0 || namelen == domainlen || *(matchstart - 1) == '.' ) &&
468 domainlen >= matchlen) {
469 matchlen = domainlen;
470 sets = ipset_pos->sets;
471 }
472 }
473#endif
474
feba5c1d 475 /* If upstream is advertising a larger UDP packet size
9009d746
SK
476 than we allow, trim it so that we don't get overlarge
477 requests for the client. We can't do this for signed packets. */
feba5c1d 478
ed4c0767 479 if ((pheader = find_pseudoheader(header, n, &plen, &sizep, &is_sign)))
feba5c1d 480 {
ed4c0767
SK
481 if (!is_sign)
482 {
483 unsigned short udpsz;
484 unsigned char *psave = sizep;
485
486 GETSHORT(udpsz, sizep);
487 if (udpsz > daemon->edns_pktsz)
488 PUTSHORT(daemon->edns_pktsz, psave);
489 }
feba5c1d 490
ed4c0767
SK
491 if (check_subnet && !check_source(header, plen, pheader, query_source))
492 {
493 my_syslog(LOG_WARNING, _("discarding DNS reply: subnet option mismatch"));
494 return 0;
495 }
feba5c1d 496 }
ed4c0767 497
feba5c1d 498
28866e95
SK
499 /* RFC 4035 sect 4.6 para 3 */
500 if (!is_sign && !option_bool(OPT_DNSSEC))
ed4c0767 501 header->hb4 &= ~HB4_AD;
28866e95 502
572b41eb 503 if (OPCODE(header) != QUERY || (RCODE(header) != NOERROR && RCODE(header) != NXDOMAIN))
0a852541
SK
504 return n;
505
feba5c1d 506 /* Complain loudly if the upstream server is non-recursive. */
572b41eb 507 if (!(header->hb4 & HB4_RA) && RCODE(header) == NOERROR && ntohs(header->ancount) == 0 &&
0a852541 508 server && !(server->flags & SERV_WARNED_RECURSIVE))
feba5c1d 509 {
3d8df260 510 prettyprint_addr(&server->addr, daemon->namebuff);
f2621c7f 511 my_syslog(LOG_WARNING, _("nameserver %s refused to do a recursive query"), daemon->namebuff);
28866e95 512 if (!option_bool(OPT_LOG))
0a852541
SK
513 server->flags |= SERV_WARNED_RECURSIVE;
514 }
515
572b41eb 516 if (daemon->bogus_addr && RCODE(header) != NXDOMAIN &&
fd9fa481 517 check_for_bogus_wildcard(header, n, daemon->namebuff, daemon->bogus_addr, now))
feba5c1d 518 {
fd9fa481 519 munged = 1;
572b41eb
SK
520 SET_RCODE(header, NXDOMAIN);
521 header->hb3 &= ~HB3_AA;
36717eee 522 }
fd9fa481 523 else
36717eee 524 {
572b41eb 525 if (RCODE(header) == NXDOMAIN &&
fd9fa481 526 extract_request(header, n, daemon->namebuff, NULL) &&
5aabfc78 527 check_for_local_domain(daemon->namebuff, now))
36717eee
SK
528 {
529 /* if we forwarded a query for a locally known name (because it was for
530 an unknown type) and the answer is NXDOMAIN, convert that to NODATA,
531 since we know that the domain exists, even if upstream doesn't */
fd9fa481 532 munged = 1;
572b41eb
SK
533 header->hb3 |= HB3_AA;
534 SET_RCODE(header, NOERROR);
feba5c1d 535 }
832af0ba 536
13d86c73 537 if (extract_addresses(header, n, daemon->namebuff, now, sets, is_sign, check_rebind, checking_disabled))
824af85b 538 {
8ef5ada2 539 my_syslog(LOG_WARNING, _("possible DNS-rebind attack detected: %s"), daemon->namebuff);
824af85b
SK
540 munged = 1;
541 }
feba5c1d 542 }
fd9fa481
SK
543
544 /* do this after extract_addresses. Ensure NODATA reply and remove
545 nameserver info. */
546
547 if (munged)
548 {
549 header->ancount = htons(0);
550 header->nscount = htons(0);
551 header->arcount = htons(0);
552 }
553
36717eee
SK
554 /* the bogus-nxdomain stuff, doctor and NXDOMAIN->NODATA munging can all elide
555 sections of the packet. Find the new length here and put back pseudoheader
556 if it was removed. */
557 return resize_packet(header, n, pheader, plen);
feba5c1d
SK
558}
559
3be34541 560/* sets new last_server */
1a6bca81 561void reply_query(int fd, int family, time_t now)
9e4abcb5
SK
562{
563 /* packet from peer server, extract data for cache, and send to
564 original requester */
572b41eb 565 struct dns_header *header;
de37951c 566 union mysockaddr serveraddr;
832af0ba 567 struct frec *forward;
de37951c 568 socklen_t addrlen = sizeof(serveraddr);
1a6bca81 569 ssize_t n = recvfrom(fd, daemon->packet, daemon->edns_pktsz, 0, &serveraddr.sa, &addrlen);
cdeda28f 570 size_t nn;
1a6bca81
SK
571 struct server *server;
572
cdeda28f
SK
573 /* packet buffer overwritten */
574 daemon->srv_save = NULL;
832af0ba 575
de37951c 576 /* Determine the address of the server replying so that we can mark that as good */
1a6bca81 577 serveraddr.sa.sa_family = family;
de37951c
SK
578#ifdef HAVE_IPV6
579 if (serveraddr.sa.sa_family == AF_INET6)
5e9e0efb 580 serveraddr.in6.sin6_flowinfo = 0;
de37951c 581#endif
9e4abcb5 582
1a6bca81
SK
583 /* spoof check: answer must come from known server, */
584 for (server = daemon->servers; server; server = server->next)
585 if (!(server->flags & (SERV_LITERAL_ADDRESS | SERV_NO_ADDR)) &&
586 sockaddr_isequal(&server->addr, &serveraddr))
587 break;
588
572b41eb 589 header = (struct dns_header *)daemon->packet;
fd9fa481 590
1a6bca81 591 if (!server ||
572b41eb 592 n < (int)sizeof(struct dns_header) || !(header->hb3 & HB3_QR) ||
1a6bca81
SK
593 !(forward = lookup_frec(ntohs(header->id), questions_crc(header, n, daemon->namebuff))))
594 return;
595
596 server = forward->sentto;
597
572b41eb 598 if ((RCODE(header) == SERVFAIL || RCODE(header) == REFUSED) &&
28866e95 599 !option_bool(OPT_ORDER) &&
1a6bca81
SK
600 forward->forwardall == 0)
601 /* for broken servers, attempt to send to another one. */
9e4abcb5 602 {
1a6bca81
SK
603 unsigned char *pheader;
604 size_t plen;
605 int is_sign;
832af0ba 606
1a6bca81
SK
607 /* recreate query from reply */
608 pheader = find_pseudoheader(header, (size_t)n, &plen, NULL, &is_sign);
609 if (!is_sign)
832af0ba 610 {
1a6bca81
SK
611 header->ancount = htons(0);
612 header->nscount = htons(0);
613 header->arcount = htons(0);
614 if ((nn = resize_packet(header, (size_t)n, pheader, plen)))
832af0ba 615 {
572b41eb 616 header->hb3 &= ~(HB3_QR | HB3_TC);
1a6bca81
SK
617 forward_query(-1, NULL, NULL, 0, header, nn, now, forward);
618 return;
832af0ba 619 }
832af0ba 620 }
1a6bca81
SK
621 }
622
623 if ((forward->sentto->flags & SERV_TYPE) == 0)
624 {
572b41eb 625 if (RCODE(header) == SERVFAIL || RCODE(header) == REFUSED)
1a6bca81
SK
626 server = NULL;
627 else
b8187c80 628 {
1a6bca81
SK
629 struct server *last_server;
630
631 /* find good server by address if possible, otherwise assume the last one we sent to */
632 for (last_server = daemon->servers; last_server; last_server = last_server->next)
633 if (!(last_server->flags & (SERV_LITERAL_ADDRESS | SERV_HAS_DOMAIN | SERV_FOR_NODOTS | SERV_NO_ADDR)) &&
634 sockaddr_isequal(&last_server->addr, &serveraddr))
635 {
636 server = last_server;
637 break;
638 }
639 }
28866e95 640 if (!option_bool(OPT_ALL_SERVERS))
1a6bca81
SK
641 daemon->last_server = server;
642 }
643
644 /* If the answer is an error, keep the forward record in place in case
645 we get a good reply from another server. Kill it when we've
646 had replies from all to avoid filling the forwarding table when
647 everything is broken */
648 if (forward->forwardall == 0 || --forward->forwardall == 1 ||
572b41eb 649 (RCODE(header) != REFUSED && RCODE(header) != SERVFAIL))
1a6bca81 650 {
28866e95 651 int check_rebind = !(forward->flags & FREC_NOREBIND);
8ef5ada2 652
28866e95 653 if (!option_bool(OPT_NO_REBIND))
8ef5ada2
SK
654 check_rebind = 0;
655
ed4c0767
SK
656 if ((nn = process_reply(header, now, server, (size_t)n, check_rebind, forward->flags & FREC_CHECKING_DISABLED,
657 forward->flags & FREC_HAS_SUBNET, &forward->source)))
1a6bca81
SK
658 {
659 header->id = htons(forward->orig_id);
572b41eb 660 header->hb4 |= HB4_RA; /* recursion if available */
54dd393f 661 send_from(forward->fd, option_bool(OPT_NOWILD) || option_bool (OPT_CLEVERBIND), daemon->packet, nn,
50303b19 662 &forward->source, &forward->dest, forward->iface);
b8187c80 663 }
1a6bca81 664 free_frec(forward); /* cancel */
9e4abcb5 665 }
9e4abcb5 666}
44a2a316 667
1a6bca81 668
5aabfc78 669void receive_query(struct listener *listen, time_t now)
44a2a316 670{
572b41eb 671 struct dns_header *header = (struct dns_header *)daemon->packet;
44a2a316 672 union mysockaddr source_addr;
c1bb8504 673 unsigned short type;
44a2a316 674 struct all_addr dst_addr;
f6b7dc47 675 struct in_addr netmask, dst_addr_4;
cdeda28f
SK
676 size_t m;
677 ssize_t n;
3b195961
VG
678 int if_index = 0, auth_dns = 0;
679#ifdef HAVE_AUTH
680 int local_auth = 0;
681#endif
44a2a316
SK
682 struct iovec iov[1];
683 struct msghdr msg;
684 struct cmsghdr *cmptr;
44a2a316
SK
685 union {
686 struct cmsghdr align; /* this ensures alignment */
687#ifdef HAVE_IPV6
688 char control6[CMSG_SPACE(sizeof(struct in6_pktinfo))];
689#endif
5e9e0efb 690#if defined(HAVE_LINUX_NETWORK)
44a2a316 691 char control[CMSG_SPACE(sizeof(struct in_pktinfo))];
824af85b
SK
692#elif defined(IP_RECVDSTADDR) && defined(HAVE_SOLARIS_NETWORK)
693 char control[CMSG_SPACE(sizeof(struct in_addr)) +
694 CMSG_SPACE(sizeof(unsigned int))];
44a2a316
SK
695#elif defined(IP_RECVDSTADDR)
696 char control[CMSG_SPACE(sizeof(struct in_addr)) +
697 CMSG_SPACE(sizeof(struct sockaddr_dl))];
698#endif
699 } control_u;
700
cdeda28f
SK
701 /* packet buffer overwritten */
702 daemon->srv_save = NULL;
703
4f7b304f
SK
704 dst_addr_4.s_addr = 0;
705 netmask.s_addr = 0;
706
7e5664bd 707 if (option_bool(OPT_NOWILD) && listen->iface)
3d8df260 708 {
4f7b304f
SK
709 auth_dns = listen->iface->dns_auth;
710
711 if (listen->family == AF_INET)
712 {
713 dst_addr_4 = listen->iface->addr.in.sin_addr;
714 netmask = listen->iface->netmask;
715 }
3d8df260 716 }
4f7b304f 717
3be34541
SK
718 iov[0].iov_base = daemon->packet;
719 iov[0].iov_len = daemon->edns_pktsz;
44a2a316
SK
720
721 msg.msg_control = control_u.control;
722 msg.msg_controllen = sizeof(control_u);
723 msg.msg_flags = 0;
724 msg.msg_name = &source_addr;
725 msg.msg_namelen = sizeof(source_addr);
726 msg.msg_iov = iov;
727 msg.msg_iovlen = 1;
728
de37951c 729 if ((n = recvmsg(listen->fd, &msg, 0)) == -1)
3be34541 730 return;
44a2a316 731
572b41eb 732 if (n < (int)sizeof(struct dns_header) ||
5e9e0efb 733 (msg.msg_flags & MSG_TRUNC) ||
572b41eb 734 (header->hb3 & HB3_QR))
26128d27
SK
735 return;
736
44a2a316
SK
737 source_addr.sa.sa_family = listen->family;
738#ifdef HAVE_IPV6
739 if (listen->family == AF_INET6)
5e9e0efb 740 source_addr.in6.sin6_flowinfo = 0;
44a2a316 741#endif
28866e95
SK
742
743 if (!option_bool(OPT_NOWILD))
26128d27
SK
744 {
745 struct ifreq ifr;
746
747 if (msg.msg_controllen < sizeof(struct cmsghdr))
748 return;
44a2a316 749
5e9e0efb 750#if defined(HAVE_LINUX_NETWORK)
26128d27
SK
751 if (listen->family == AF_INET)
752 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
c72daea8 753 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_PKTINFO)
26128d27 754 {
8ef5ada2
SK
755 union {
756 unsigned char *c;
757 struct in_pktinfo *p;
758 } p;
759 p.c = CMSG_DATA(cmptr);
760 dst_addr_4 = dst_addr.addr.addr4 = p.p->ipi_spec_dst;
761 if_index = p.p->ipi_ifindex;
26128d27
SK
762 }
763#elif defined(IP_RECVDSTADDR) && defined(IP_RECVIF)
764 if (listen->family == AF_INET)
44a2a316 765 {
26128d27 766 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
8ef5ada2
SK
767 {
768 union {
769 unsigned char *c;
770 unsigned int *i;
771 struct in_addr *a;
772#ifndef HAVE_SOLARIS_NETWORK
773 struct sockaddr_dl *s;
774#endif
775 } p;
776 p.c = CMSG_DATA(cmptr);
777 if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVDSTADDR)
778 dst_addr_4 = dst_addr.addr.addr4 = *(p.a);
779 else if (cmptr->cmsg_level == IPPROTO_IP && cmptr->cmsg_type == IP_RECVIF)
824af85b 780#ifdef HAVE_SOLARIS_NETWORK
8ef5ada2 781 if_index = *(p.i);
824af85b 782#else
8ef5ada2 783 if_index = p.s->sdl_index;
824af85b 784#endif
8ef5ada2 785 }
44a2a316 786 }
44a2a316 787#endif
26128d27 788
44a2a316 789#ifdef HAVE_IPV6
26128d27
SK
790 if (listen->family == AF_INET6)
791 {
792 for (cmptr = CMSG_FIRSTHDR(&msg); cmptr; cmptr = CMSG_NXTHDR(&msg, cmptr))
c72daea8 793 if (cmptr->cmsg_level == IPPROTO_IPV6 && cmptr->cmsg_type == daemon->v6pktinfo)
26128d27 794 {
8ef5ada2
SK
795 union {
796 unsigned char *c;
797 struct in6_pktinfo *p;
798 } p;
799 p.c = CMSG_DATA(cmptr);
800
801 dst_addr.addr.addr6 = p.p->ipi6_addr;
802 if_index = p.p->ipi6_ifindex;
26128d27
SK
803 }
804 }
44a2a316 805#endif
26128d27
SK
806
807 /* enforce available interface configuration */
808
e25db1f2 809 if (!indextoname(listen->fd, if_index, ifr.ifr_name))
5e9e0efb 810 return;
832af0ba 811
e25db1f2
SK
812 if (!iface_check(listen->family, &dst_addr, ifr.ifr_name, &auth_dns))
813 {
814 if (!option_bool(OPT_CLEVERBIND))
115ac3e4 815 enumerate_interfaces(0);
3f2873d4
SK
816 if (!loopback_exception(listen->fd, listen->family, &dst_addr, ifr.ifr_name) &&
817 !label_exception(if_index, listen->family, &dst_addr))
e25db1f2
SK
818 return;
819 }
820
552af8b9
SK
821 if (listen->family == AF_INET && option_bool(OPT_LOCALISE))
822 {
823 struct irec *iface;
824
825 /* get the netmask of the interface whch has the address we were sent to.
826 This is no neccessarily the interface we arrived on. */
827
828 for (iface = daemon->interfaces; iface; iface = iface->next)
829 if (iface->addr.sa.sa_family == AF_INET &&
830 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
831 break;
832
833 /* interface may be new */
e25db1f2 834 if (!iface && !option_bool(OPT_CLEVERBIND))
115ac3e4 835 enumerate_interfaces(0);
552af8b9
SK
836
837 for (iface = daemon->interfaces; iface; iface = iface->next)
838 if (iface->addr.sa.sa_family == AF_INET &&
839 iface->addr.in.sin_addr.s_addr == dst_addr_4.s_addr)
840 break;
841
842 /* If we failed, abandon localisation */
843 if (iface)
844 netmask = iface->netmask;
845 else
846 dst_addr_4.s_addr = 0;
847 }
44a2a316
SK
848 }
849
cdeda28f 850 if (extract_request(header, (size_t)n, daemon->namebuff, &type))
44a2a316 851 {
1a6bca81 852 char types[20];
b485ed97
SK
853#ifdef HAVE_AUTH
854 struct auth_zone *zone;
855#endif
1a6bca81 856
4f7b304f 857 querystr(auth_dns ? "auth" : "query", types, type);
1a6bca81 858
44a2a316 859 if (listen->family == AF_INET)
3be34541 860 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
1a6bca81 861 (struct all_addr *)&source_addr.in.sin_addr, types);
44a2a316
SK
862#ifdef HAVE_IPV6
863 else
3be34541 864 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
1a6bca81 865 (struct all_addr *)&source_addr.in6.sin6_addr, types);
44a2a316 866#endif
44a2a316 867
b485ed97
SK
868#ifdef HAVE_AUTH
869 /* find queries for zones we're authoritative for, and answer them directly */
6008bdbb
SK
870 if (!auth_dns)
871 for (zone = daemon->auth_zones; zone; zone = zone->next)
872 if (in_zone(zone, daemon->namebuff, NULL))
873 {
874 auth_dns = 1;
875 local_auth = 1;
876 break;
877 }
b485ed97
SK
878#endif
879 }
880
4820dce9 881#ifdef HAVE_AUTH
4f7b304f 882 if (auth_dns)
824af85b 883 {
19b16891 884 m = answer_auth(header, ((char *) header) + PACKETSZ, (size_t)n, now, &source_addr, local_auth);
4f7b304f 885 if (m >= 1)
b485ed97
SK
886 {
887 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
888 (char *)header, m, &source_addr, &dst_addr, if_index);
889 daemon->auth_answer++;
890 }
824af85b 891 }
44a2a316 892 else
4820dce9 893#endif
4f7b304f
SK
894 {
895 m = answer_request(header, ((char *) header) + PACKETSZ, (size_t)n,
896 dst_addr_4, netmask, now);
897
898 if (m >= 1)
899 {
900 send_from(listen->fd, option_bool(OPT_NOWILD) || option_bool(OPT_CLEVERBIND),
901 (char *)header, m, &source_addr, &dst_addr, if_index);
902 daemon->local_answer++;
903 }
904 else if (forward_query(listen->fd, &source_addr, &dst_addr, if_index,
905 header, (size_t)n, now, NULL))
906 daemon->queries_forwarded++;
907 else
908 daemon->local_answer++;
909 }
44a2a316
SK
910}
911
feba5c1d
SK
912/* The daemon forks before calling this: it should deal with one connection,
913 blocking as neccessary, and then return. Note, need to be a bit careful
914 about resources for debug mode, when the fork is suppressed: that's
915 done by the caller. */
5aabfc78 916unsigned char *tcp_request(int confd, time_t now,
4f7b304f 917 union mysockaddr *local_addr, struct in_addr netmask, int auth_dns)
feba5c1d 918{
28866e95
SK
919 size_t size = 0;
920 int norebind = 0;
3b195961 921#ifdef HAVE_AUTH
19b16891 922 int local_auth = 0;
3b195961 923#endif
ed4c0767 924 int checking_disabled, check_subnet;
cdeda28f 925 size_t m;
ee86ce68
SK
926 unsigned short qtype;
927 unsigned int gotname;
feba5c1d 928 unsigned char c1, c2;
4b5ea12e
SK
929 /* Max TCP packet + slop + size */
930 unsigned char *packet = whine_malloc(65536 + MAXDNAME + RRFIXEDSZ + sizeof(u16));
931 unsigned char *payload = &packet[2];
932 /* largest field in header is 16-bits, so this is still sufficiently aligned */
933 struct dns_header *header = (struct dns_header *)payload;
934 u16 *length = (u16 *)packet;
3be34541 935 struct server *last_server;
7de060b0
SK
936 struct in_addr dst_addr_4;
937 union mysockaddr peer_addr;
938 socklen_t peer_len = sizeof(union mysockaddr);
3be34541 939
7de060b0
SK
940 if (getpeername(confd, (struct sockaddr *)&peer_addr, &peer_len) == -1)
941 return packet;
942
feba5c1d
SK
943 while (1)
944 {
945 if (!packet ||
946 !read_write(confd, &c1, 1, 1) || !read_write(confd, &c2, 1, 1) ||
947 !(size = c1 << 8 | c2) ||
4b5ea12e 948 !read_write(confd, payload, size, 1))
feba5c1d
SK
949 return packet;
950
572b41eb 951 if (size < (int)sizeof(struct dns_header))
feba5c1d
SK
952 continue;
953
ed4c0767
SK
954 check_subnet = 0;
955
28866e95 956 /* save state of "cd" flag in query */
572b41eb 957 checking_disabled = header->hb4 & HB4_CD;
28866e95
SK
958
959 /* RFC 4035: sect 4.6 para 2 */
572b41eb 960 header->hb4 &= ~HB4_AD;
feba5c1d 961
3be34541 962 if ((gotname = extract_request(header, (unsigned int)size, daemon->namebuff, &qtype)))
feba5c1d 963 {
7de060b0 964 char types[20];
b485ed97
SK
965#ifdef HAVE_AUTH
966 struct auth_zone *zone;
967#endif
4f7b304f 968 querystr(auth_dns ? "auth" : "query", types, qtype);
7de060b0
SK
969
970 if (peer_addr.sa.sa_family == AF_INET)
971 log_query(F_QUERY | F_IPV4 | F_FORWARD, daemon->namebuff,
972 (struct all_addr *)&peer_addr.in.sin_addr, types);
feba5c1d 973#ifdef HAVE_IPV6
7de060b0
SK
974 else
975 log_query(F_QUERY | F_IPV6 | F_FORWARD, daemon->namebuff,
976 (struct all_addr *)&peer_addr.in6.sin6_addr, types);
feba5c1d 977#endif
b485ed97
SK
978
979#ifdef HAVE_AUTH
980 /* find queries for zones we're authoritative for, and answer them directly */
6008bdbb
SK
981 if (!auth_dns)
982 for (zone = daemon->auth_zones; zone; zone = zone->next)
983 if (in_zone(zone, daemon->namebuff, NULL))
984 {
985 auth_dns = 1;
986 local_auth = 1;
987 break;
988 }
b485ed97 989#endif
feba5c1d
SK
990 }
991
7de060b0
SK
992 if (local_addr->sa.sa_family == AF_INET)
993 dst_addr_4 = local_addr->in.sin_addr;
994 else
995 dst_addr_4.s_addr = 0;
996
4820dce9 997#ifdef HAVE_AUTH
4f7b304f 998 if (auth_dns)
19b16891 999 m = answer_auth(header, ((char *) header) + 65536, (size_t)size, now, &peer_addr, local_auth);
4f7b304f 1000 else
4820dce9 1001#endif
feba5c1d 1002 {
4f7b304f
SK
1003 /* m > 0 if answered from cache */
1004 m = answer_request(header, ((char *) header) + 65536, (size_t)size,
1005 dst_addr_4, netmask, now);
feba5c1d 1006
4f7b304f
SK
1007 /* Do this by steam now we're not in the select() loop */
1008 check_log_writer(NULL);
1009
1010 if (m == 0)
feba5c1d 1011 {
4f7b304f
SK
1012 unsigned int flags = 0;
1013 struct all_addr *addrp = NULL;
1014 int type = 0;
1015 char *domain = NULL;
feba5c1d 1016
4f7b304f
SK
1017 if (option_bool(OPT_ADD_MAC))
1018 size = add_mac(header, size, ((char *) header) + 65536, &peer_addr);
ed4c0767
SK
1019
1020 if (option_bool(OPT_CLIENT_SUBNET))
1021 {
1022 size_t new = add_source_addr(header, size, ((char *) header) + 65536, &peer_addr);
1023 if (size != new)
1024 {
1025 size = new;
1026 check_subnet = 1;
1027 }
1028 }
1029
4f7b304f
SK
1030 if (gotname)
1031 flags = search_servers(now, &addrp, gotname, daemon->namebuff, &type, &domain, &norebind);
1032
1033 if (type != 0 || option_bool(OPT_ORDER) || !daemon->last_server)
1034 last_server = daemon->servers;
1035 else
1036 last_server = daemon->last_server;
1037
1038 if (!flags && last_server)
1039 {
1040 struct server *firstsendto = NULL;
1041 unsigned int crc = questions_crc(header, (unsigned int)size, daemon->namebuff);
1042
1043 /* Loop round available servers until we succeed in connecting to one.
1044 Note that this code subtley ensures that consecutive queries on this connection
1045 which can go to the same server, do so. */
1046 while (1)
feba5c1d 1047 {
4f7b304f
SK
1048 if (!firstsendto)
1049 firstsendto = last_server;
1050 else
1051 {
1052 if (!(last_server = last_server->next))
1053 last_server = daemon->servers;
1054
1055 if (last_server == firstsendto)
1056 break;
1057 }
1058
1059 /* server for wrong domain */
1060 if (type != (last_server->flags & SERV_TYPE) ||
1061 (type == SERV_HAS_DOMAIN && !hostname_isequal(domain, last_server->domain)))
7de060b0
SK
1062 continue;
1063
4f7b304f 1064 if (last_server->tcpfd == -1)
7de060b0 1065 {
4f7b304f
SK
1066 if ((last_server->tcpfd = socket(last_server->addr.sa.sa_family, SOCK_STREAM, 0)) == -1)
1067 continue;
1068
1069 if ((!local_bind(last_server->tcpfd, &last_server->source_addr, last_server->interface, 1) ||
1070 connect(last_server->tcpfd, &last_server->addr.sa, sa_len(&last_server->addr)) == -1))
1071 {
1072 close(last_server->tcpfd);
1073 last_server->tcpfd = -1;
1074 continue;
1075 }
1076
7de060b0 1077#ifdef HAVE_CONNTRACK
4f7b304f
SK
1078 /* Copy connection mark of incoming query to outgoing connection. */
1079 if (option_bool(OPT_CONNTRACK))
1080 {
1081 unsigned int mark;
1082 struct all_addr local;
7de060b0 1083#ifdef HAVE_IPV6
4f7b304f
SK
1084 if (local_addr->sa.sa_family == AF_INET6)
1085 local.addr.addr6 = local_addr->in6.sin6_addr;
1086 else
7de060b0 1087#endif
4f7b304f
SK
1088 local.addr.addr4 = local_addr->in.sin_addr;
1089
1090 if (get_incoming_mark(&peer_addr, &local, 1, &mark))
1091 setsockopt(last_server->tcpfd, SOL_SOCKET, SO_MARK, &mark, sizeof(unsigned int));
1092 }
7de060b0 1093#endif
4f7b304f
SK
1094 }
1095
4b5ea12e 1096 *length = htons(size);
4f7b304f 1097
4b5ea12e 1098 if (!read_write(last_server->tcpfd, packet, size + sizeof(u16), 0) ||
4f7b304f
SK
1099 !read_write(last_server->tcpfd, &c1, 1, 1) ||
1100 !read_write(last_server->tcpfd, &c2, 1, 1))
1101 {
1102 close(last_server->tcpfd);
1103 last_server->tcpfd = -1;
1104 continue;
1105 }
1106
1107 m = (c1 << 8) | c2;
4b5ea12e 1108 if (!read_write(last_server->tcpfd, payload, m, 1))
4f7b304f
SK
1109 return packet;
1110
1111 if (!gotname)
1112 strcpy(daemon->namebuff, "query");
1113 if (last_server->addr.sa.sa_family == AF_INET)
1114 log_query(F_SERVER | F_IPV4 | F_FORWARD, daemon->namebuff,
1115 (struct all_addr *)&last_server->addr.in.sin_addr, NULL);
feba5c1d 1116#ifdef HAVE_IPV6
4f7b304f
SK
1117 else
1118 log_query(F_SERVER | F_IPV6 | F_FORWARD, daemon->namebuff,
1119 (struct all_addr *)&last_server->addr.in6.sin6_addr, NULL);
feba5c1d 1120#endif
4f7b304f
SK
1121
1122 /* There's no point in updating the cache, since this process will exit and
1123 lose the information after a few queries. We make this call for the alias and
1124 bogus-nxdomain side-effects. */
1125 /* If the crc of the question section doesn't match the crc we sent, then
1126 someone might be attempting to insert bogus values into the cache by
1127 sending replies containing questions and bogus answers. */
1128 if (crc == questions_crc(header, (unsigned int)m, daemon->namebuff))
1129 m = process_reply(header, now, last_server, (unsigned int)m,
ed4c0767
SK
1130 option_bool(OPT_NO_REBIND) && !norebind, checking_disabled,
1131 check_subnet, &peer_addr);
4f7b304f
SK
1132
1133 break;
1134 }
feba5c1d 1135 }
4f7b304f
SK
1136
1137 /* In case of local answer or no connections made. */
1138 if (m == 0)
1139 m = setup_reply(header, (unsigned int)size, addrp, flags, daemon->local_ttl);
feba5c1d 1140 }
feba5c1d 1141 }
4f7b304f 1142
5aabfc78 1143 check_log_writer(NULL);
feba5c1d 1144
4b5ea12e
SK
1145 *length = htons(m);
1146
1147 if (m == 0 || !read_write(confd, packet, m + sizeof(u16), 0))
feba5c1d
SK
1148 return packet;
1149 }
1150}
1151
1697269c 1152static struct frec *allocate_frec(time_t now)
9e4abcb5 1153{
1697269c
SK
1154 struct frec *f;
1155
5aabfc78 1156 if ((f = (struct frec *)whine_malloc(sizeof(struct frec))))
9e4abcb5 1157 {
1a6bca81 1158 f->next = daemon->frec_list;
1697269c 1159 f->time = now;
832af0ba 1160 f->sentto = NULL;
1a6bca81 1161 f->rfd4 = NULL;
28866e95 1162 f->flags = 0;
1a6bca81
SK
1163#ifdef HAVE_IPV6
1164 f->rfd6 = NULL;
1165#endif
1166 daemon->frec_list = f;
1697269c 1167 }
9e4abcb5 1168
1697269c
SK
1169 return f;
1170}
9e4abcb5 1171
1a6bca81
SK
1172static struct randfd *allocate_rfd(int family)
1173{
1174 static int finger = 0;
1175 int i;
1176
1177 /* limit the number of sockets we have open to avoid starvation of
1178 (eg) TFTP. Once we have a reasonable number, randomness should be OK */
1179
1180 for (i = 0; i < RANDOM_SOCKS; i++)
9009d746 1181 if (daemon->randomsocks[i].refcount == 0)
1a6bca81 1182 {
9009d746
SK
1183 if ((daemon->randomsocks[i].fd = random_sock(family)) == -1)
1184 break;
1185
1a6bca81
SK
1186 daemon->randomsocks[i].refcount = 1;
1187 daemon->randomsocks[i].family = family;
1188 return &daemon->randomsocks[i];
1189 }
1190
9009d746 1191 /* No free ones or cannot get new socket, grab an existing one */
1a6bca81
SK
1192 for (i = 0; i < RANDOM_SOCKS; i++)
1193 {
1194 int j = (i+finger) % RANDOM_SOCKS;
9009d746
SK
1195 if (daemon->randomsocks[j].refcount != 0 &&
1196 daemon->randomsocks[j].family == family &&
1197 daemon->randomsocks[j].refcount != 0xffff)
1a6bca81
SK
1198 {
1199 finger = j;
1200 daemon->randomsocks[j].refcount++;
1201 return &daemon->randomsocks[j];
1202 }
1203 }
1204
1205 return NULL; /* doom */
1206}
1207
1208static void free_frec(struct frec *f)
1209{
1210 if (f->rfd4 && --(f->rfd4->refcount) == 0)
1211 close(f->rfd4->fd);
1212
1213 f->rfd4 = NULL;
1214 f->sentto = NULL;
28866e95 1215 f->flags = 0;
1a6bca81
SK
1216
1217#ifdef HAVE_IPV6
1218 if (f->rfd6 && --(f->rfd6->refcount) == 0)
1219 close(f->rfd6->fd);
1220
1221 f->rfd6 = NULL;
1222#endif
1223}
1224
1697269c
SK
1225/* if wait==NULL return a free or older than TIMEOUT record.
1226 else return *wait zero if one available, or *wait is delay to
1a6bca81
SK
1227 when the oldest in-use record will expire. Impose an absolute
1228 limit of 4*TIMEOUT before we wipe things (for random sockets) */
5aabfc78 1229struct frec *get_new_frec(time_t now, int *wait)
1697269c 1230{
1a6bca81 1231 struct frec *f, *oldest, *target;
1697269c
SK
1232 int count;
1233
1234 if (wait)
1235 *wait = 0;
1236
1a6bca81 1237 for (f = daemon->frec_list, oldest = NULL, target = NULL, count = 0; f; f = f->next, count++)
832af0ba 1238 if (!f->sentto)
1a6bca81
SK
1239 target = f;
1240 else
1697269c 1241 {
1a6bca81
SK
1242 if (difftime(now, f->time) >= 4*TIMEOUT)
1243 {
1244 free_frec(f);
1245 target = f;
1246 }
1247
1248 if (!oldest || difftime(f->time, oldest->time) <= 0)
1249 oldest = f;
1697269c 1250 }
1a6bca81
SK
1251
1252 if (target)
1253 {
1254 target->time = now;
1255 return target;
1256 }
9e4abcb5
SK
1257
1258 /* can't find empty one, use oldest if there is one
1259 and it's older than timeout */
1697269c 1260 if (oldest && ((int)difftime(now, oldest->time)) >= TIMEOUT)
9e4abcb5 1261 {
1697269c
SK
1262 /* keep stuff for twice timeout if we can by allocating a new
1263 record instead */
1264 if (difftime(now, oldest->time) < 2*TIMEOUT &&
1265 count <= daemon->ftabsize &&
1266 (f = allocate_frec(now)))
1267 return f;
1268
1269 if (!wait)
1270 {
1a6bca81 1271 free_frec(oldest);
1697269c
SK
1272 oldest->time = now;
1273 }
9e4abcb5
SK
1274 return oldest;
1275 }
1276
1697269c 1277 /* none available, calculate time 'till oldest record expires */
208b65c5 1278 if (count > daemon->ftabsize)
1697269c 1279 {
0da5e897
MSB
1280 static time_t last_log = 0;
1281
1697269c
SK
1282 if (oldest && wait)
1283 *wait = oldest->time + (time_t)TIMEOUT - now;
0da5e897
MSB
1284
1285 if ((int)difftime(now, last_log) > 5)
1286 {
1287 last_log = now;
1288 my_syslog(LOG_WARNING, _("Maximum number of concurrent DNS queries reached (max: %d)"), daemon->ftabsize);
1289 }
1290
9e4abcb5
SK
1291 return NULL;
1292 }
1697269c
SK
1293
1294 if (!(f = allocate_frec(now)) && wait)
1295 /* wait one second on malloc failure */
1296 *wait = 1;
9e4abcb5 1297
9e4abcb5
SK
1298 return f; /* OK if malloc fails and this is NULL */
1299}
1300
832af0ba
SK
1301/* crc is all-ones if not known. */
1302static struct frec *lookup_frec(unsigned short id, unsigned int crc)
9e4abcb5
SK
1303{
1304 struct frec *f;
1305
1a6bca81 1306 for(f = daemon->frec_list; f; f = f->next)
832af0ba
SK
1307 if (f->sentto && f->new_id == id &&
1308 (f->crc == crc || crc == 0xffffffff))
9e4abcb5
SK
1309 return f;
1310
1311 return NULL;
1312}
1313
1314static struct frec *lookup_frec_by_sender(unsigned short id,
fd9fa481
SK
1315 union mysockaddr *addr,
1316 unsigned int crc)
9e4abcb5 1317{
feba5c1d
SK
1318 struct frec *f;
1319
1a6bca81 1320 for(f = daemon->frec_list; f; f = f->next)
832af0ba 1321 if (f->sentto &&
9e4abcb5 1322 f->orig_id == id &&
fd9fa481 1323 f->crc == crc &&
9e4abcb5
SK
1324 sockaddr_isequal(&f->source, addr))
1325 return f;
1326
1327 return NULL;
1328}
1329
849a8357 1330/* A server record is going away, remove references to it */
5aabfc78 1331void server_gone(struct server *server)
849a8357
SK
1332{
1333 struct frec *f;
1334
1a6bca81 1335 for (f = daemon->frec_list; f; f = f->next)
832af0ba 1336 if (f->sentto && f->sentto == server)
1a6bca81 1337 free_frec(f);
849a8357
SK
1338
1339 if (daemon->last_server == server)
1340 daemon->last_server = NULL;
1341
1342 if (daemon->srv_save == server)
1343 daemon->srv_save = NULL;
1344}
9e4abcb5 1345
316e2730
SK
/* return unique random ids: keep drawing 16-bit values from rand16() until
   one turns up that lookup_frec() does not find in use for this crc. */
static unsigned short get_id(unsigned int crc)
{
  unsigned short candidate;

  for (;;)
    {
      candidate = rand16();

      if (!lookup_frec(candidate, crc))
        return candidate;
    }
}
1357
1358
1359
1360
1361