resolv/res_send.c

   1 /* Copyright (C) 2016-2019 Free Software Foundation, Inc.
   2    This file is part of the GNU C Library.
   3
   4    The GNU C Library is free software; you can redistribute it and/or
   5    modify it under the terms of the GNU Lesser General Public
   6    License as published by the Free Software Foundation; either
   7    version 2.1 of the License, or (at your option) any later version.
   8
   9    The GNU C Library is distributed in the hope that it will be useful,
  10    but WITHOUT ANY WARRANTY; without even the implied warranty of
  11    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  12    Lesser General Public License for more details.
  13
  14    You should have received a copy of the GNU Lesser General Public
  15    License along with the GNU C Library; if not, see
  16    <http://www.gnu.org/licenses/>.  */
  17
  18 /*
  19  * Copyright (c) 1985, 1989, 1993
  20  *    The Regents of the University of California.  All rights reserved.
  21  *
  22  * Redistribution and use in source and binary forms, with or without
  23  * modification, are permitted provided that the following conditions
  24  * are met:
  25  * 1. Redistributions of source code must retain the above copyright
  26  *    notice, this list of conditions and the following disclaimer.
  27  * 2. Redistributions in binary form must reproduce the above copyright
  28  *    notice, this list of conditions and the following disclaimer in the
  29  *    documentation and/or other materials provided with the distribution.
  30  * 4. Neither the name of the University nor the names of its contributors
  31  *    may be used to endorse or promote products derived from this software
  32  *    without specific prior written permission.
  33  *
  34  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  35  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  36  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  37  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  38  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  39  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  40  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  41  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  42  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  43  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  44  * SUCH DAMAGE.
  45  */
  46
  47 /*
  48  * Portions Copyright (c) 1993 by Digital Equipment Corporation.
  49  *
  50  * Permission to use, copy, modify, and distribute this software for any
  51  * purpose with or without fee is hereby granted, provided that the above
  52  * copyright notice and this permission notice appear in all copies, and that
  53  * the name of Digital Equipment Corporation not be used in advertising or
  54  * publicity pertaining to distribution of the document or software without
  55  * specific, written prior permission.
  56  *
  57  * THE SOFTWARE IS PROVIDED "AS IS" AND DIGITAL EQUIPMENT CORP. DISCLAIMS ALL
  58  * WARRANTIES WITH REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES
  59  * OF MERCHANTABILITY AND FITNESS.   IN NO EVENT SHALL DIGITAL EQUIPMENT
  60  * CORPORATION BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
  61  * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
  62  * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
  63  * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS
  64  * SOFTWARE.
  65  */
  66
  67 /*
  68  * Portions Copyright (c) 1996-1999 by Internet Software Consortium.
  69  *
  70  * Permission to use, copy, modify, and distribute this software for any
  71  * purpose with or without fee is hereby granted, provided that the above
  72  * copyright notice and this permission notice appear in all copies.
  73  *
  74  * THE SOFTWARE IS PROVIDED "AS IS" AND INTERNET SOFTWARE CONSORTIUM DISCLAIMS
  75  * ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES
  76  * OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL INTERNET SOFTWARE
  77  * CONSORTIUM BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
  78  * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
  79  * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS
  80  * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS
  81  * SOFTWARE.
  82  */
  83
  84 /*
  85  * Send query to name server and wait for reply.
  86  */
  87
  88 #include <assert.h>
  89 #include <sys/types.h>
  90 #include <sys/param.h>
  91 #include <sys/time.h>
  92 #include <sys/socket.h>
  93 #include <sys/uio.h>
  94 #include <sys/poll.h>
  95
  96 #include <netinet/in.h>
  97 #include <arpa/nameser.h>
  98 #include <arpa/inet.h>
  99 #include <sys/ioctl.h>
 100
 101 #include <errno.h>
 102 #include <fcntl.h>
 103 #include <netdb.h>
 104 #include <resolv/resolv-internal.h>
 105 #include <resolv/resolv_context.h>
 106 #include <signal.h>
 107 #include <stdlib.h>
 108 #include <string.h>
 109 #include <unistd.h>
 110 #include <kernel-features.h>
 111 #include <libc-diag.h>
 112 #include <random-bits.h>
 113
 114 #if PACKETSZ > 65536
 115 #define MAXPACKET       PACKETSZ
 116 #else
 117 #define MAXPACKET       65536
 118 #endif
 119
 120 /* From ev_streams.c.  */
 121
 122 static inline void
 123 __attribute ((always_inline))
 124 evConsIovec(void *buf, size_t cnt, struct iovec *vec) {
 125         memset(vec, 0xf5, sizeof (*vec));
 126         vec->iov_base = buf;
 127         vec->iov_len = cnt;
 128 }
 129
 130 /* From ev_timers.c.  */
 131
 132 #define BILLION 1000000000
 133
 134 static inline void
 135 evConsTime(struct timespec *res, time_t sec, long nsec) {
 136         res->tv_sec = sec;
 137         res->tv_nsec = nsec;
 138 }
 139
 140 static inline void
 141 evAddTime(struct timespec *res, const struct timespec *addend1,
 142           const struct timespec *addend2) {
 143         res->tv_sec = addend1->tv_sec + addend2->tv_sec;
 144         res->tv_nsec = addend1->tv_nsec + addend2->tv_nsec;
 145         if (res->tv_nsec >= BILLION) {
 146                 res->tv_sec++;
 147                 res->tv_nsec -= BILLION;
 148         }
 149 }
 150
 151 static inline void
 152 evSubTime(struct timespec *res, const struct timespec *minuend,
 153           const struct timespec *subtrahend) {
 154        res->tv_sec = minuend->tv_sec - subtrahend->tv_sec;
 155         if (minuend->tv_nsec >= subtrahend->tv_nsec)
 156                 res->tv_nsec = minuend->tv_nsec - subtrahend->tv_nsec;
 157         else {
 158                 res->tv_nsec = (BILLION
 159                                 - subtrahend->tv_nsec + minuend->tv_nsec);
 160                 res->tv_sec--;
 161         }
 162 }
 163
 164 static int
 165 evCmpTime(struct timespec a, struct timespec b) {
 166         long x = a.tv_sec - b.tv_sec;
 167
 168         if (x == 0L)
 169                 x = a.tv_nsec - b.tv_nsec;
 170         return (x < 0L ? (-1) : x > 0L ? (1) : (0));
 171 }
 172
 173 static void
 174 evNowTime(struct timespec *res) {
 175         struct timeval now;
 176
 177         if (gettimeofday(&now, NULL) < 0)
 178                 evConsTime(res, 0, 0);
 179         else
 180                 TIMEVAL_TO_TIMESPEC (&now, res);
 181 }
 182
 183
 184 #define EXT(res) ((res)->_u._ext)
 185
 186 /* Forward. */
 187
 188 static struct sockaddr *get_nsaddr (res_state, unsigned int);
 189 static int              send_vc(res_state, const u_char *, int,
 190                                 const u_char *, int,
 191                                 u_char **, int *, int *, int, u_char **,
 192                                 u_char **, int *, int *, int *);
 193 static int              send_dg(res_state, const u_char *, int,
 194                                 const u_char *, int,
 195                                 u_char **, int *, int *, int,
 196                                 int *, int *, u_char **,
 197                                 u_char **, int *, int *, int *);
 198 static int              sock_eq(struct sockaddr_in6 *, struct sockaddr_in6 *);
 199
 200 /* Public. */
 201
 202 /* int
 203  * res_isourserver(ina)
 204  *      looks up "ina" in _res.ns_addr_list[]
 205  * returns:
 206  *      0  : not found
 207  *      >0 : found
 208  * author:
 209  *      paul vixie, 29may94
 210  */
 211 int
 212 res_ourserver_p(const res_state statp, const struct sockaddr_in6 *inp)
 213 {
 214         int ns;
 215
 216         if (inp->sin6_family == AF_INET) {
 217             struct sockaddr_in *in4p = (struct sockaddr_in *) inp;
 218             in_port_t port = in4p->sin_port;
 219             in_addr_t addr = in4p->sin_addr.s_addr;
 220
 221             for (ns = 0;  ns < statp->nscount;  ns++) {
 222                 const struct sockaddr_in *srv =
 223                     (struct sockaddr_in *) get_nsaddr (statp, ns);
 224
 225                 if ((srv->sin_family == AF_INET) &&
 226                     (srv->sin_port == port) &&
 227                     (srv->sin_addr.s_addr == INADDR_ANY ||
 228                      srv->sin_addr.s_addr == addr))
 229                     return (1);
 230             }
 231         } else if (inp->sin6_family == AF_INET6) {
 232             for (ns = 0;  ns < statp->nscount;  ns++) {
 233                 const struct sockaddr_in6 *srv
 234                   = (struct sockaddr_in6 *) get_nsaddr (statp, ns);
 235                 if ((srv->sin6_family == AF_INET6) &&
 236                     (srv->sin6_port == inp->sin6_port) &&
 237                     !(memcmp(&srv->sin6_addr, &in6addr_any,
 238                              sizeof (struct in6_addr)) &&
 239                       memcmp(&srv->sin6_addr, &inp->sin6_addr,
 240                              sizeof (struct in6_addr))))
 241                     return (1);
 242             }
 243         }
 244         return (0);
 245 }
 246
 247 int
 248 res_isourserver (const struct sockaddr_in *inp)
 249 {
 250   return res_ourserver_p (&_res, (const struct sockaddr_in6 *) inp);
 251 }
 252
 253 /* int
 254  * res_nameinquery(name, type, class, buf, eom)
 255  *      look for (name,type,class) in the query section of packet (buf,eom)
 256  * requires:
 257  *      buf + HFIXEDSZ <= eom
 258  * returns:
 259  *      -1 : format error
 260  *      0  : not found
 261  *      >0 : found
 262  * author:
 263  *      paul vixie, 29may94
 264  */
 265 int
 266 res_nameinquery(const char *name, int type, int class,
 267                 const u_char *buf, const u_char *eom)
 268 {
 269         const u_char *cp = buf + HFIXEDSZ;
 270         int qdcount = ntohs(((HEADER*)buf)->qdcount);
 271
 272         while (qdcount-- > 0) {
 273                 char tname[MAXDNAME+1];
 274                 int n, ttype, tclass;
 275
 276                 n = dn_expand(buf, eom, cp, tname, sizeof tname);
 277                 if (n < 0)
 278                         return (-1);
 279                 cp += n;
 280                 if (cp + 2 * INT16SZ > eom)
 281                         return (-1);
 282                 NS_GET16(ttype, cp);
 283                 NS_GET16(tclass, cp);
 284                 if (ttype == type && tclass == class &&
 285                     ns_samename(tname, name) == 1)
 286                         return (1);
 287         }
 288         return (0);
 289 }
 290 libresolv_hidden_def (res_nameinquery)
 291
 292 /* Returns a shift value for the name server index.  Used to implement
 293    RES_ROTATE.  */
 294 static unsigned int
 295 nameserver_offset (struct __res_state *statp)
 296 {
 297   /* If we only have one name server or rotation is disabled, return
 298      offset 0 (no rotation).  */
 299   unsigned int nscount = statp->nscount;
 300   if (nscount <= 1 || !(statp->options & RES_ROTATE))
 301     return 0;
 302
 303   /* Global offset.  The lowest bit indicates whether the offset has
 304      been initialized with a random value.  Use relaxed MO to access
 305      global_offset because all we need is a sequence of roughly
 306      sequential value.  */
 307   static unsigned int global_offset;
 308   unsigned int offset = atomic_fetch_add_relaxed (&global_offset, 2);
 309   if ((offset & 1) == 0)
 310     {
 311       /* Initialization is required.  */
 312       offset = random_bits ();
 313       /* The lowest bit is the most random.  Preserve it.  */
 314       offset <<= 1;
 315
 316       /* Store the new starting value.  atomic_fetch_add_relaxed
 317          returns the old value, so emulate that by storing the new
 318          (incremented) value.  Concurrent initialization with
 319          different random values is harmless.  */
 320       atomic_store_relaxed (&global_offset, (offset | 1) + 2);
 321     }
 322
 323   /* Remove the initialization bit.  */
 324   offset >>= 1;
 325
 326   /* Avoid the division in the most common cases.  */
 327   switch (nscount)
 328     {
 329     case 2:
 330       return offset & 1;
 331     case 3:
 332       return offset % 3;
 333     case 4:
 334       return offset & 3;
 335     default:
 336       return offset % nscount;
 337     }
 338 }
 339
 340 /* int
 341  * res_queriesmatch(buf1, eom1, buf2, eom2)
 342  *      is there a 1:1 mapping of (name,type,class)
 343  *      in (buf1,eom1) and (buf2,eom2)?
 344  * returns:
 345  *      -1 : format error
 346  *      0  : not a 1:1 mapping
 347  *      >0 : is a 1:1 mapping
 348  * author:
 349  *      paul vixie, 29may94
 350  */
 351 int
 352 res_queriesmatch(const u_char *buf1, const u_char *eom1,
 353                  const u_char *buf2, const u_char *eom2)
 354 {
 355         if (buf1 + HFIXEDSZ > eom1 || buf2 + HFIXEDSZ > eom2)
 356                 return (-1);
 357
 358         /*
 359          * Only header section present in replies to
 360          * dynamic update packets.
 361          */
 362         if ((((HEADER *)buf1)->opcode == ns_o_update) &&
 363             (((HEADER *)buf2)->opcode == ns_o_update))
 364                 return (1);
 365
 366         /* Note that we initially do not convert QDCOUNT to the host byte
 367            order.  We can compare it with the second buffer's QDCOUNT
 368            value without doing this.  */
 369         int qdcount = ((HEADER*)buf1)->qdcount;
 370         if (qdcount != ((HEADER*)buf2)->qdcount)
 371                 return (0);
 372
 373         qdcount = htons (qdcount);
 374         const u_char *cp = buf1 + HFIXEDSZ;
 375
 376         while (qdcount-- > 0) {
 377                 char tname[MAXDNAME+1];
 378                 int n, ttype, tclass;
 379
 380                 n = dn_expand(buf1, eom1, cp, tname, sizeof tname);
 381                 if (n < 0)
 382                         return (-1);
 383                 cp += n;
 384                 if (cp + 2 * INT16SZ > eom1)
 385                         return (-1);
 386                 NS_GET16(ttype, cp);
 387                 NS_GET16(tclass, cp);
 388                 if (!res_nameinquery(tname, ttype, tclass, buf2, eom2))
 389                         return (0);
 390         }
 391         return (1);
 392 }
 393 libresolv_hidden_def (res_queriesmatch)
 394
 395 int
 396 __res_context_send (struct resolv_context *ctx,
 397                     const unsigned char *buf, int buflen,
 398                     const unsigned char *buf2, int buflen2,
 399                     unsigned char *ans, int anssiz,
 400                     unsigned char **ansp, unsigned char **ansp2,
 401                     int *nansp2, int *resplen2, int *ansp2_malloced)
 402 {
 403         struct __res_state *statp = ctx->resp;
 404         int gotsomewhere, terrno, try, v_circuit, resplen, n;
 405
 406         if (statp->nscount == 0) {
 407                 __set_errno (ESRCH);
 408                 return (-1);
 409         }
 410
 411         if (anssiz < (buf2 == NULL ? 1 : 2) * HFIXEDSZ) {
 412                 __set_errno (EINVAL);
 413                 return (-1);
 414         }
 415
 416         v_circuit = ((statp->options & RES_USEVC)
 417                      || buflen > PACKETSZ
 418                      || buflen2 > PACKETSZ);
 419         gotsomewhere = 0;
 420         terrno = ETIMEDOUT;
 421
 422         /*
 423          * If the ns_addr_list in the resolver context has changed, then
 424          * invalidate our cached copy and the associated timing data.
 425          */
 426         if (EXT(statp).nscount != 0) {
 427                 int needclose = 0;
 428
 429                 if (EXT(statp).nscount != statp->nscount)
 430                         needclose++;
 431                 else
 432                         for (unsigned int ns = 0; ns < statp->nscount; ns++) {
 433                                 if (statp->nsaddr_list[ns].sin_family != 0
 434                                     && !sock_eq((struct sockaddr_in6 *)
 435                                                 &statp->nsaddr_list[ns],
 436                                                 EXT(statp).nsaddrs[ns]))
 437                                 {
 438                                         needclose++;
 439                                         break;
 440                                 }
 441                         }
 442                 if (needclose) {
 443                         __res_iclose(statp, false);
 444                         EXT(statp).nscount = 0;
 445                 }
 446         }
 447
 448         /*
 449          * Maybe initialize our private copy of the ns_addr_list.
 450          */
 451         if (EXT(statp).nscount == 0) {
 452                 for (unsigned int ns = 0; ns < statp->nscount; ns++) {
 453                         EXT(statp).nssocks[ns] = -1;
 454                         if (statp->nsaddr_list[ns].sin_family == 0)
 455                                 continue;
 456                         if (EXT(statp).nsaddrs[ns] == NULL)
 457                                 EXT(statp).nsaddrs[ns] =
 458                                     malloc(sizeof (struct sockaddr_in6));
 459                         if (EXT(statp).nsaddrs[ns] != NULL)
 460                                 memset (mempcpy(EXT(statp).nsaddrs[ns],
 461                                                 &statp->nsaddr_list[ns],
 462                                                 sizeof (struct sockaddr_in)),
 463                                         '\0',
 464                                         sizeof (struct sockaddr_in6)
 465                                         - sizeof (struct sockaddr_in));
 466                         else
 467                                 return -1;
 468                 }
 469                 EXT(statp).nscount = statp->nscount;
 470         }
 471
 472         /* Name server index offset.  Used to implement
 473            RES_ROTATE.  */
 474         unsigned int ns_offset = nameserver_offset (statp);
 475
 476         /*
 477          * Send request, RETRY times, or until successful.
 478          */
 479         for (try = 0; try < statp->retry; try++) {
 480             for (unsigned ns_shift = 0; ns_shift < statp->nscount; ns_shift++)
 481             {
 482                 /* The actual name server index.  This implements
 483                    RES_ROTATE.  */
 484                 unsigned int ns = ns_shift + ns_offset;
 485                 if (ns >= statp->nscount)
 486                         ns -= statp->nscount;
 487
 488             same_ns:
 489                 if (__glibc_unlikely (v_circuit))       {
 490                         /* Use VC; at most one attempt per server. */
 491                         try = statp->retry;
 492                         n = send_vc(statp, buf, buflen, buf2, buflen2,
 493                                     &ans, &anssiz, &terrno,
 494                                     ns, ansp, ansp2, nansp2, resplen2,
 495                                     ansp2_malloced);
 496                         if (n < 0)
 497                                 return (-1);
 498                         if (n == 0 && (buf2 == NULL || *resplen2 == 0))
 499                                 goto next_ns;
 500                 } else {
 501                         /* Use datagrams. */
 502                         n = send_dg(statp, buf, buflen, buf2, buflen2,
 503                                     &ans, &anssiz, &terrno,
 504                                     ns, &v_circuit, &gotsomewhere, ansp,
 505                                     ansp2, nansp2, resplen2, ansp2_malloced);
 506                         if (n < 0)
 507                                 return (-1);
 508                         if (n == 0 && (buf2 == NULL || *resplen2 == 0))
 509                                 goto next_ns;
 510                         if (v_circuit)
 511                           // XXX Check whether both requests failed or
 512                           // XXX whether one has been answered successfully
 513                                 goto same_ns;
 514                 }
 515
 516                 resplen = n;
 517
 518                 /*
 519                  * If we have temporarily opened a virtual circuit,
 520                  * or if we haven't been asked to keep a socket open,
 521                  * close the socket.
 522                  */
 523                 if ((v_circuit && (statp->options & RES_USEVC) == 0) ||
 524                     (statp->options & RES_STAYOPEN) == 0) {
 525                         __res_iclose(statp, false);
 526                 }
 527                 return (resplen);
 528  next_ns: ;
 529            } /*foreach ns*/
 530         } /*foreach retry*/
 531         __res_iclose(statp, false);
 532         if (!v_circuit) {
 533                 if (!gotsomewhere)
 534                         __set_errno (ECONNREFUSED);     /* no nameservers found */
 535                 else
 536                         __set_errno (ETIMEDOUT);        /* no answer obtained */
 537         } else
 538                 __set_errno (terrno);
 539         return (-1);
 540 }
 541
 542 /* Common part of res_nsend and res_send.  */
 543 static int
 544 context_send_common (struct resolv_context *ctx,
 545                      const unsigned char *buf, int buflen,
 546                      unsigned char *ans, int anssiz)
 547 {
 548   if (ctx == NULL)
 549     {
 550       RES_SET_H_ERRNO (&_res, NETDB_INTERNAL);
 551       return -1;
 552     }
 553   int result = __res_context_send (ctx, buf, buflen, NULL, 0, ans, anssiz,
 554                                    NULL, NULL, NULL, NULL, NULL);
 555   __resolv_context_put (ctx);
 556   return result;
 557 }
 558
 559 int
 560 res_nsend (res_state statp, const unsigned char *buf, int buflen,
 561            unsigned char *ans, int anssiz)
 562 {
 563   return context_send_common
 564     (__resolv_context_get_override (statp), buf, buflen, ans, anssiz);
 565 }
 566
 567 int
 568 res_send (const unsigned char *buf, int buflen, unsigned char *ans, int anssiz)
 569 {
 570   return context_send_common
 571     (__resolv_context_get (), buf, buflen, ans, anssiz);
 572 }
 573
 574 /* Private */
 575
 576 static struct sockaddr *
 577 get_nsaddr (res_state statp, unsigned int n)
 578 {
 579   assert (n < statp->nscount);
 580
 581   if (statp->nsaddr_list[n].sin_family == 0 && EXT(statp).nsaddrs[n] != NULL)
 582     /* EXT(statp).nsaddrs[n] holds an address that is larger than
 583        struct sockaddr, and user code did not update
 584        statp->nsaddr_list[n].  */
 585     return (struct sockaddr *) EXT(statp).nsaddrs[n];
 586   else
 587     /* User code updated statp->nsaddr_list[n], or statp->nsaddr_list[n]
 588        has the same content as EXT(statp).nsaddrs[n].  */
 589     return (struct sockaddr *) (void *) &statp->nsaddr_list[n];
 590 }
 591
 592 /* Close the resolver structure, assign zero to *RESPLEN2 if RESPLEN2
 593    is not NULL, and return zero.  */
 594 static int
 595 __attribute__ ((warn_unused_result))
 596 close_and_return_error (res_state statp, int *resplen2)
 597 {
 598   __res_iclose(statp, false);
 599   if (resplen2 != NULL)
 600     *resplen2 = 0;
 601   return 0;
 602 }
 603
 604 /* The send_vc function is responsible for sending a DNS query over TCP
 605    to the nameserver numbered NS from the res_state STATP i.e.
 606    EXT(statp).nssocks[ns].  The function supports sending both IPv4 and
  607    IPv6 queries serially on the same socket.
 608
 609    Please note that for TCP there is no way to disable sending both
 610    queries, unlike UDP, which honours RES_SNGLKUP and RES_SNGLKUPREOP
 611    and sends the queries serially and waits for the result after each
 612    sent query.  This implementation should be corrected to honour these
 613    options.
 614
 615    Please also note that for TCP we send both queries over the same
 616    socket one after another.  This technically violates best practice
 617    since the server is allowed to read the first query, respond, and
 618    then close the socket (to service another client).  If the server
 619    does this, then the remaining second query in the socket data buffer
 620    will cause the server to send the client an RST which will arrive
 621    asynchronously and the client's OS will likely tear down the socket
 622    receive buffer resulting in a potentially short read and lost
 623    response data.  This will force the client to retry the query again,
 624    and this process may repeat until all servers and connection resets
 625    are exhausted and then the query will fail.  It's not known if this
 626    happens with any frequency in real DNS server implementations.  This
 627    implementation should be corrected to use two sockets by default for
 628    parallel queries.
 629
 630    The query stored in BUF of BUFLEN length is sent first followed by
 631    the query stored in BUF2 of BUFLEN2 length.  Queries are sent
 632    serially on the same socket.
 633
 634    Answers to the query are stored firstly in *ANSP up to a max of
 635    *ANSSIZP bytes.  If more than *ANSSIZP bytes are needed and ANSCP
 636    is non-NULL (to indicate that modifying the answer buffer is allowed)
 637    then malloc is used to allocate a new response buffer and ANSCP and
 638    ANSP will both point to the new buffer.  If more than *ANSSIZP bytes
 639    are needed but ANSCP is NULL, then as much of the response as
 640    possible is read into the buffer, but the results will be truncated.
 641    When truncation happens because of a small answer buffer the DNS
  642    packet's header field TC will be set to 1, indicating a truncated
 643    message and the rest of the socket data will be read and discarded.
 644
 645    Answers to the query are stored secondly in *ANSP2 up to a max of
 646    *ANSSIZP2 bytes, with the actual response length stored in
  647    *RESPLEN2.  If more than *ANSSIZP2 bytes are needed and ANSP2
 648    is non-NULL (required for a second query) then malloc is used to
 649    allocate a new response buffer, *ANSSIZP2 is set to the new buffer
 650    size and *ANSP2_MALLOCED is set to 1.
 651
 652    The ANSP2_MALLOCED argument will eventually be removed as the
 653    change in buffer pointer can be used to detect the buffer has
 654    changed and that the caller should use free on the new buffer.
 655
 656    Note that the answers may arrive in any order from the server and
 657    therefore the first and second answer buffers may not correspond to
 658    the first and second queries.
 659
 660    It is not supported to call this function with a non-NULL ANSP2
 661    but a NULL ANSCP.  Put another way, you can call send_vc with a
 662    single unmodifiable buffer or two modifiable buffers, but no other
 663    combination is supported.
 664
 665    It is the caller's responsibility to free the malloc allocated
 666    buffers by detecting that the pointers have changed from their
 667    original values i.e. *ANSCP or *ANSP2 has changed.
 668
 669    If errors are encountered then *TERRNO is set to an appropriate
 670    errno value and a zero result is returned for a recoverable error,
 671    and a less-than zero result is returned for a non-recoverable error.
 672
 673    If no errors are encountered then *TERRNO is left unmodified and
  674    the length of the first response in bytes is returned.  */
 675 static int
 676 send_vc(res_state statp,
 677         const u_char *buf, int buflen, const u_char *buf2, int buflen2,
 678         u_char **ansp, int *anssizp,
 679         int *terrno, int ns, u_char **anscp, u_char **ansp2, int *anssizp2,
 680         int *resplen2, int *ansp2_malloced)
 681 {
 682         const HEADER *hp = (HEADER *) buf;
 683         const HEADER *hp2 = (HEADER *) buf2;
 684         HEADER *anhp = (HEADER *) *ansp;
 685         struct sockaddr *nsap = get_nsaddr (statp, ns);
 686         int truncating, connreset, n;
 687         /* On some architectures compiler might emit a warning indicating
 688            'resplen' may be used uninitialized.  However if buf2 == NULL
 689            then this code won't be executed; if buf2 != NULL, then first
 690            time round the loop recvresp1 and recvresp2 will be 0 so this
 691            code won't be executed but "thisresplenp = &resplen;" followed
 692            by "*thisresplenp = rlen;" will be executed so that subsequent
 693            times round the loop resplen has been initialized.  So this is
 694            a false-positive.
 695          */
 696         DIAG_PUSH_NEEDS_COMMENT;
 697         DIAG_IGNORE_NEEDS_COMMENT (5, "-Wmaybe-uninitialized");
 698         int resplen;
 699         DIAG_POP_NEEDS_COMMENT;
 700         struct iovec iov[4];
 701         u_short len;
 702         u_short len2;
 703         u_char *cp;
 704
 705         connreset = 0;
 706  same_ns:
 707         truncating = 0;
 708
 709         /* Are we still talking to whom we want to talk to? */
 710         if (statp->_vcsock >= 0 && (statp->_flags & RES_F_VC) != 0) {
 711                 struct sockaddr_in6 peer;
 712                 socklen_t size = sizeof peer;
 713
 714                 if (getpeername(statp->_vcsock,
 715                                 (struct sockaddr *)&peer, &size) < 0 ||
 716                     !sock_eq(&peer, (struct sockaddr_in6 *) nsap)) {
 717                         __res_iclose(statp, false);
 718                         statp->_flags &= ~RES_F_VC;
 719                 }
 720         }
 721
 722         if (statp->_vcsock < 0 || (statp->_flags & RES_F_VC) == 0) {
 723                 if (statp->_vcsock >= 0)
 724                   __res_iclose(statp, false);
 725
 726                 statp->_vcsock = socket
 727                   (nsap->sa_family, SOCK_STREAM | SOCK_CLOEXEC, 0);
 728                 if (statp->_vcsock < 0) {
 729                         *terrno = errno;
 730                         if (resplen2 != NULL)
 731                           *resplen2 = 0;
 732                         return (-1);
 733                 }
 734                 __set_errno (0);
 735                 if (connect(statp->_vcsock, nsap,
 736                             nsap->sa_family == AF_INET
 737                             ? sizeof (struct sockaddr_in)
 738                             : sizeof (struct sockaddr_in6)) < 0) {
 739                         *terrno = errno;
 740                         return close_and_return_error (statp, resplen2);
 741                 }
 742                 statp->_flags |= RES_F_VC;
 743         }
 744
 745         /*
 746          * Send length & message
 747          */
 748         len = htons ((u_short) buflen);
 749         evConsIovec(&len, INT16SZ, &iov[0]);
 750         evConsIovec((void*)buf, buflen, &iov[1]);
 751         int niov = 2;
 752         ssize_t explen = INT16SZ + buflen;
 753         if (buf2 != NULL) {
 754                 len2 = htons ((u_short) buflen2);
 755                 evConsIovec(&len2, INT16SZ, &iov[2]);
 756                 evConsIovec((void*)buf2, buflen2, &iov[3]);
 757                 niov = 4;
 758                 explen += INT16SZ + buflen2;
 759         }
 760         if (TEMP_FAILURE_RETRY (writev(statp->_vcsock, iov, niov)) != explen) {
 761                 *terrno = errno;
 762                 return close_and_return_error (statp, resplen2);
 763         }
 764         /*
 765          * Receive length & response
 766          */
 767         int recvresp1 = 0;
 768         /* Skip the second response if there is no second query.
 769            To do that we mark the second response as received.  */
 770         int recvresp2 = buf2 == NULL;
 771         uint16_t rlen16;
 772  read_len:
 773         cp = (u_char *)&rlen16;
 774         len = sizeof(rlen16);
 775         while ((n = TEMP_FAILURE_RETRY (read(statp->_vcsock, cp,
 776                                              (int)len))) > 0) {
 777                 cp += n;
 778                 if ((len -= n) <= 0)
 779                         break;
 780         }
 781         if (n <= 0) {
 782                 *terrno = errno;
 783                 /*
 784                  * A long running process might get its TCP
 785                  * connection reset if the remote server was
 786                  * restarted.  Requery the server instead of
 787                  * trying a new one.  When there is only one
 788                  * server, this means that a query might work
 789                  * instead of failing.  We only allow one reset
 790                  * per query to prevent looping.
 791                  */
 792                 if (*terrno == ECONNRESET && !connreset)
 793                   {
 794                     __res_iclose (statp, false);
 795                     connreset = 1;
 796                     goto same_ns;
 797                   }
 798                 return close_and_return_error (statp, resplen2);
 799         }
 800         int rlen = ntohs (rlen16);
 801
 802         int *thisanssizp;
 803         u_char **thisansp;
 804         int *thisresplenp;
 805         if ((recvresp1 | recvresp2) == 0 || buf2 == NULL) {
 806                 /* We have not received any responses
 807                    yet or we only have one response to
 808                    receive.  */
 809                 thisanssizp = anssizp;
 810                 thisansp = anscp ?: ansp;
 811                 assert (anscp != NULL || ansp2 == NULL);
 812                 thisresplenp = &resplen;
 813         } else {
 814                 thisanssizp = anssizp2;
 815                 thisansp = ansp2;
 816                 thisresplenp = resplen2;
 817         }
 818         anhp = (HEADER *) *thisansp;
 819
 820         *thisresplenp = rlen;
 821         /* Is the answer buffer too small?  */
 822         if (*thisanssizp < rlen) {
 823                 /* If the current buffer is not the the static
 824                    user-supplied buffer then we can reallocate
 825                    it.  */
 826                 if (thisansp != NULL && thisansp != ansp) {
 827                         /* Always allocate MAXPACKET, callers expect
 828                            this specific size.  */
 829                         u_char *newp = malloc (MAXPACKET);
 830                         if (newp == NULL)
 831                           {
 832                             *terrno = ENOMEM;
 833                             return close_and_return_error (statp, resplen2);
 834                           }
 835                         *thisanssizp = MAXPACKET;
 836                         *thisansp = newp;
 837                         if (thisansp == ansp2)
 838                           *ansp2_malloced = 1;
 839                         anhp = (HEADER *) newp;
 840                         /* A uint16_t can't be larger than MAXPACKET
 841                            thus it's safe to allocate MAXPACKET but
 842                            read RLEN bytes instead.  */
 843                         len = rlen;
 844                 } else {
 845                         truncating = 1;
 846                         len = *thisanssizp;
 847                 }
 848         } else
 849                 len = rlen;
 850
 851         if (__glibc_unlikely (len < HFIXEDSZ))       {
 852                 /*
 853                  * Undersized message.
 854                  */
 855                 *terrno = EMSGSIZE;
 856                 return close_and_return_error (statp, resplen2);
 857         }
 858
 859         cp = *thisansp;
 860         while (len != 0 && (n = read(statp->_vcsock, (char *)cp, (int)len)) > 0){
 861                 cp += n;
 862                 len -= n;
 863         }
 864         if (__glibc_unlikely (n <= 0))       {
 865                 *terrno = errno;
 866                 return close_and_return_error (statp, resplen2);
 867         }
 868         if (__glibc_unlikely (truncating))       {
 869                 /*
 870                  * Flush rest of answer so connection stays in synch.
 871                  */
 872                 anhp->tc = 1;
 873                 len = rlen - *thisanssizp;
 874                 while (len != 0) {
 875                         char junk[PACKETSZ];
 876
 877                         n = read(statp->_vcsock, junk,
 878                                  (len > sizeof junk) ? sizeof junk : len);
 879                         if (n > 0)
 880                                 len -= n;
 881                         else
 882                                 break;
 883                 }
 884         }
 885         /*
 886          * If the calling application has bailed out of
 887          * a previous call and failed to arrange to have
 888          * the circuit closed or the server has got
 889          * itself confused, then drop the packet and
 890          * wait for the correct one.
 891          */
 892         if ((recvresp1 || hp->id != anhp->id)
 893             && (recvresp2 || hp2->id != anhp->id))
 894                 goto read_len;
 895
 896         /* Mark which reply we received.  */
 897         if (recvresp1 == 0 && hp->id == anhp->id)
 898           recvresp1 = 1;
 899         else
 900           recvresp2 = 1;
 901         /* Repeat waiting if we have a second answer to arrive.  */
 902         if ((recvresp1 & recvresp2) == 0)
 903                 goto read_len;
 904
 905         /*
 906          * All is well, or the error is fatal.  Signal that the
 907          * next nameserver ought not be tried.
 908          */
 909         return resplen;
 910 }
 911
 912 static int
 913 reopen (res_state statp, int *terrno, int ns)
 914 {
 915         if (EXT(statp).nssocks[ns] == -1) {
 916                 struct sockaddr *nsap = get_nsaddr (statp, ns);
 917                 socklen_t slen;
 918
 919                 /* only try IPv6 if IPv6 NS and if not failed before */
 920                 if (nsap->sa_family == AF_INET6 && !statp->ipv6_unavail) {
 921                         EXT(statp).nssocks[ns] = socket
 922                           (PF_INET6,
 923                            SOCK_DGRAM | SOCK_NONBLOCK | SOCK_CLOEXEC, 0);
 924                         if (EXT(statp).nssocks[ns] < 0)
 925                             statp->ipv6_unavail = errno == EAFNOSUPPORT;
 926                         slen = sizeof (struct sockaddr_in6);
 927                 } else if (nsap->sa_family == AF_INET) {
 928                         EXT(statp).nssocks[ns] = socket
 929                           (PF_INET,
 930                            SOCK_DGRAM | SOCK_NONBLOCK | SOCK_CLOEXEC, 0);
 931                         slen = sizeof (struct sockaddr_in);
 932                 }
 933                 if (EXT(statp).nssocks[ns] < 0) {
 934                         *terrno = errno;
 935                         return (-1);
 936                 }
 937
 938                 /* Enable full ICMP error reporting for this
 939                    socket.  */
 940                 if (__res_enable_icmp (nsap->sa_family,
 941                                        EXT (statp).nssocks[ns]) < 0)
 942                   {
 943                     int saved_errno = errno;
 944                     __res_iclose (statp, false);
 945                     __set_errno (saved_errno);
 946                     *terrno = saved_errno;
 947                     return -1;
 948                   }
 949
 950                 /*
 951                  * On a 4.3BSD+ machine (client and server,
 952                  * actually), sending to a nameserver datagram
 953                  * port with no nameserver will cause an
 954                  * ICMP port unreachable message to be returned.
 955                  * If our datagram socket is "connected" to the
 956                  * server, we get an ECONNREFUSED error on the next
 957                  * socket operation, and select returns if the
 958                  * error message is received.  We can thus detect
 959                  * the absence of a nameserver without timing out.
 960                  */
 961                 /* With GCC 5.3 when compiling with -Os the compiler
 962                    emits a warning that slen may be used uninitialized,
 963                    but that is never true.  Both slen and
 964                    EXT(statp).nssocks[ns] are initialized together or
 965                    the function return -1 before control flow reaches
 966                    the call to connect with slen.  */
 967                 DIAG_PUSH_NEEDS_COMMENT;
 968                 DIAG_IGNORE_Os_NEEDS_COMMENT (5, "-Wmaybe-uninitialized");
 969                 if (connect(EXT(statp).nssocks[ns], nsap, slen) < 0) {
 970                 DIAG_POP_NEEDS_COMMENT;
 971                         __res_iclose(statp, false);
 972                         return (0);
 973                 }
 974         }
 975
 976         return 1;
 977 }
 978
/* The send_dg function is responsible for sending a DNS query over UDP
   to the nameserver numbered NS from the res_state STATP i.e.
   EXT(statp).nssocks[ns].  The function supports IPv4 and IPv6 queries
   along with the ability to send the query in parallel for both stacks
   (default) or serially (RES_SNGLKUP).  It also supports serial lookup
   with a close and reopen of the socket used to talk to the server
   (RES_SNGLKUPREOP) to work around broken name servers.
 986
   The query stored in BUF of BUFLEN length is sent first followed by
   the query stored in BUF2 of BUFLEN2 length.  Queries are sent
   in parallel (default) or serially (RES_SNGLKUP or RES_SNGLKUPREOP).
 990
   Answers to the query are stored firstly in *ANSP up to a max of
   *ANSSIZP bytes.  If more than *ANSSIZP bytes are needed and ANSCP
   is non-NULL (to indicate that modifying the answer buffer is allowed)
   then malloc is used to allocate a new response buffer and ANSCP and
   ANSP will both point to the new buffer.  If more than *ANSSIZP bytes
   are needed but ANSCP is NULL, then as much of the response as
   possible is read into the buffer, but the results will be truncated.
   When truncation happens because of a small answer buffer the DNS
   packet's header field TC will be set to 1, indicating a truncated
   message, while the rest of the UDP packet is discarded.
1001
   Answers to the query are stored secondly in *ANSP2 up to a max of
   *ANSSIZP2 bytes, with the actual response length stored in
   *RESPLEN2.  If more than *ANSSIZP2 bytes are needed and ANSP2
   is non-NULL (required for a second query) then malloc is used to
   allocate a new response buffer, *ANSSIZP2 is set to the new buffer
   size and *ANSP2_MALLOCED is set to 1.
1008
1009    The ANSP2_MALLOCED argument will eventually be removed as the
1010    change in buffer pointer can be used to detect the buffer has
1011    changed and that the caller should use free on the new buffer.
1012
1013    Note that the answers may arrive in any order from the server and
1014    therefore the first and second answer buffers may not correspond to
1015    the first and second queries.
1016
   It is not supported to call this function with a non-NULL ANSP2
   but a NULL ANSCP.  Put another way, you can call send_dg with a
   single unmodifiable buffer or two modifiable buffers, but no other
   combination is supported.
1021
1022    It is the caller's responsibility to free the malloc allocated
1023    buffers by detecting that the pointers have changed from their
1024    original values i.e. *ANSCP or *ANSP2 has changed.
1025
1026    If an answer is truncated because of UDP datagram DNS limits then
1027    *V_CIRCUIT is set to 1 and the return value non-zero to indicate to
1028    the caller to retry with TCP.  The value *GOTSOMEWHERE is set to 1
1029    if any progress was made reading a response from the nameserver and
1030    is used by the caller to distinguish between ECONNREFUSED and
1031    ETIMEDOUT (the latter if *GOTSOMEWHERE is 1).
1032
1033    If errors are encountered then *TERRNO is set to an appropriate
1034    errno value and a zero result is returned for a recoverable error,
1035    and a less-than zero result is returned for a non-recoverable error.
1036
   If no errors are encountered then *TERRNO is left unmodified and
   the length of the first response in bytes is returned.  */
static int
send_dg(res_state statp,
        const u_char *buf, int buflen, const u_char *buf2, int buflen2,
        u_char **ansp, int *anssizp,
        int *terrno, int ns, int *v_circuit, int *gotsomewhere, u_char **anscp,
        u_char **ansp2, int *anssizp2, int *resplen2, int *ansp2_malloced)
{
        /* HP and HP2 view the two queries as DNS headers; their id
           fields are compared against the id of each received answer.
           HP2 is only dereferenced while recvresp2 is 0, and recvresp2
           starts out as 1 when BUF2 is NULL.  */
        const HEADER *hp = (HEADER *) buf;
        const HEADER *hp2 = (HEADER *) buf2;
        struct timespec now, timeout, finish;
        struct pollfd pfd[1];
        int ptimeout;
        struct sockaddr_in6 from;
        int resplen = 0;
        int n;

        /*
         * Compute time for the total operation.
         */
        int seconds = (statp->retrans << ns);
        if (ns > 0)
                seconds /= statp->nscount;
        if (seconds <= 0)
                seconds = 1;
        /* RES_SNGLKUPREOP implies single-request mode as well.  */
        bool single_request_reopen = (statp->options & RES_SNGLKUPREOP) != 0;
        bool single_request = (((statp->options & RES_SNGLKUP) != 0)
                               | single_request_reopen);
        /* Saved so that *GOTSOMEWHERE can be restored when the whole
           exchange is restarted in a different mode (see the timeout
           handling below).  */
        int save_gotsomewhere = *gotsomewhere;

        int retval;
        /* Entry point for (re)opening the socket: used initially and
           after switching to RES_SNGLKUPREOP mode.  A result <= 0 from
           reopen is passed straight back to the caller after clearing
           *RESPLEN2.  */
 retry_reopen:
        retval = reopen (statp, terrno, ns);
        if (retval <= 0)
          {
            if (resplen2 != NULL)
              *resplen2 = 0;
            return retval;
          }
        /* Start of a fresh exchange: set up FINISH from NOW and a
           TIMEOUT of SECONDS seconds, and reset the send/receive
           bookkeeping.  */
 retry:
        evNowTime(&now);
        evConsTime(&timeout, seconds, 0);
        evAddTime(&finish, &now, &timeout);
        int need_recompute = 0;
        /* Number of queries handed to the kernel so far in this
           exchange.  */
        int nwritten = 0;
        int recvresp1 = 0;
        /* Skip the second response if there is no second query.
           To do that we mark the second response as received.  */
        int recvresp2 = buf2 == NULL;
        pfd[0].fd = EXT(statp).nssocks[ns];
        /* Begin by waiting for the socket to become writable.  */
        pfd[0].events = POLLOUT;
        /* Main loop.  Every path that needs another poll jumps back
           to this label.  */
 wait:
        if (need_recompute) {
                /* Also entered directly (via goto) after EINTR/EAGAIN.
                   Refresh TIMEOUT with the time left until FINISH; if
                   evCmpTime does not rank FINISH after NOW, the
                   exchange is abandoned.  */
        recompute_resend:
                evNowTime(&now);
                if (evCmpTime(finish, now) <= 0) {
                        /* Shared exit for an expired deadline and for
                           poll failures.  */
                poll_err_out:
                        return close_and_return_error (statp, resplen2);
                }
                evSubTime(&timeout, &finish, &now);
                need_recompute = 0;
        }
        /* Convert struct timespec in milliseconds.  */
        ptimeout = timeout.tv_sec * 1000 + timeout.tv_nsec / 1000000;

        /* Before anything has been sent, probe with a zero timeout.
           If that reports nothing ready, or if something has already
           been sent, block for up to PTIMEOUT milliseconds and note
           that the remaining time must be recomputed before the next
           poll.  */
        n = 0;
        if (nwritten == 0)
          n = __poll (pfd, 1, 0);
        if (__glibc_unlikely (n == 0))       {
                n = __poll (pfd, 1, ptimeout);
                need_recompute = 1;
        }
        if (n == 0) {
                /* The blocking poll timed out.  The condition below
                   holds when one reply has already been accepted in
                   this exchange and RESPLEN is greater than 1.  */
                if (resplen > 1 && (recvresp1 || (buf2 != NULL && recvresp2)))
                  {
                    /* There are quite a few broken name servers out
                       there which don't handle two outstanding
                       requests from the same source.  There are also
                       broken firewall settings.  If we time out after
                       having received one answer switch to the mode
                       where we send the second request only once we
                       have received the first answer.  */
                    if (!single_request)
                      {
                        statp->options |= RES_SNGLKUP;
                        single_request = true;
                        *gotsomewhere = save_gotsomewhere;
                        goto retry;
                      }
                    else if (!single_request_reopen)
                      {
                        statp->options |= RES_SNGLKUPREOP;
                        single_request_reopen = true;
                        *gotsomewhere = save_gotsomewhere;
                        __res_iclose (statp, false);
                        goto retry_reopen;
                      }

                    /* Both fallback modes are already active: return
                       the answer that was received.
                       NOTE(review): *RESPLEN2 = 1 is presumably a
                       marker the caller interprets as "no usable
                       second answer" -- confirm against the caller.  */
                    *resplen2 = 1;
                    return resplen;
                  }

                /* Plain timeout: report it by returning 0 with
                   *GOTSOMEWHERE set.  */
                *gotsomewhere = 1;
                if (resplen2 != NULL)
                  *resplen2 = 0;
                return 0;
        }
        if (n < 0) {
                /* poll failed.  An interrupted call is retried with a
                   recomputed timeout; anything else ends the
                   exchange.  */
                if (errno == EINTR)
                        goto recompute_resend;

                goto poll_err_out;
        }
        /* Presumably cleared so that the errno tests after the send
           and receive calls below cannot see a value left over from
           an earlier call.  */
        __set_errno (0);
        if (pfd[0].revents & POLLOUT) {
                /* have_sendmmsg: 0 means not yet determined, -1 means
                   __sendmmsg failed with ENOSYS and send is used
                   instead, 1 is stored after a failure other than
                   ENOSYS (and is the constant value when
                   __ASSUME_SENDMMSG is defined).  */
#ifndef __ASSUME_SENDMMSG
                static int have_sendmmsg;
#else
# define have_sendmmsg 1
#endif
                /* Send both queries with a single __sendmmsg call when
                   nothing has been sent yet, there is a second query,
                   and parallel mode is in effect.  */
                if (have_sendmmsg >= 0 && nwritten == 0 && buf2 != NULL
                    && !single_request)
                  {
                    struct iovec iov =
                      { .iov_base = (void *) buf, .iov_len = buflen };
                    struct iovec iov2 =
                      { .iov_base = (void *) buf2, .iov_len = buflen2 };
                    struct mmsghdr reqs[2] =
                      {
                        {
                          .msg_hdr =
                            {
                              .msg_iov = &iov,
                              .msg_iovlen = 1,
                            },
                        },
                        {
                          .msg_hdr =
                            {
                              .msg_iov = &iov2,
                              .msg_iovlen = 1,
                            }
                        },
                      };

                    int ndg = __sendmmsg (pfd[0].fd, reqs, 2, MSG_NOSIGNAL);
                    if (__glibc_likely (ndg == 2))
                      {
                        /* Both datagrams were accepted; make sure each
                           was sent in full, then wait for answers
                           only.  */
                        if (reqs[0].msg_len != buflen
                            || reqs[1].msg_len != buflen2)
                          goto fail_sendmmsg;

                        pfd[0].events = POLLIN;
                        nwritten += 2;
                      }
                    else if (ndg == 1 && reqs[0].msg_len == buflen)
                      /* Only the first query went out; continue as if
                         it had been sent with a plain send.  */
                      goto just_one;
                    else if (ndg < 0 && (errno == EINTR || errno == EAGAIN))
                      goto recompute_resend;
                    else
                      {
#ifndef __ASSUME_SENDMMSG
                        if (__glibc_unlikely (have_sendmmsg == 0))
                          {
                            if (ndg < 0 && errno == ENOSYS)
                              {
                                have_sendmmsg = -1;
                                goto try_send;
                              }
                            have_sendmmsg = 1;
                          }
#endif

                      fail_sendmmsg:
                        return close_and_return_error (statp, resplen2);
                      }
                  }
                else
                  {
                    /* Send a single query with send: the first one if
                       nothing has been written yet, otherwise the
                       second one.  */
                    ssize_t sr;
#ifndef __ASSUME_SENDMMSG
                  try_send:
#endif
                    if (nwritten != 0)
                      sr = send (pfd[0].fd, buf2, buflen2, MSG_NOSIGNAL);
                    else
                      sr = send (pfd[0].fd, buf, buflen, MSG_NOSIGNAL);

                    if (sr != (nwritten != 0 ? buflen2 : buflen)) {
                      if (errno == EINTR || errno == EAGAIN)
                        goto recompute_resend;
                      return close_and_return_error (statp, resplen2);
                    }
                    /* Also reached from the __sendmmsg path above when
                       only the first datagram was sent.  Wait for
                       input only if this was the second query, there
                       is no second query, or single-request mode is
                       active; otherwise also wait for writability so
                       that the second query can follow.  */
                  just_one:
                    if (nwritten != 0 || buf2 == NULL || single_request)
                      pfd[0].events = POLLIN;
                    else
                      pfd[0].events = POLLIN | POLLOUT;
                    ++nwritten;
                  }
                goto wait;
        } else if (pfd[0].revents & POLLIN) {
                /* Buffer size, buffer pointer and length slot used
                   for the datagram that is about to be read.  */
                int *thisanssizp;
                u_char **thisansp;
                int *thisresplenp;

                if ((recvresp1 | recvresp2) == 0 || buf2 == NULL) {
                        /* We have not received any responses
                           yet or we only have one response to
                           receive.  */
                        thisanssizp = anssizp;
                        thisansp = anscp ?: ansp;
                        assert (anscp != NULL || ansp2 == NULL);
                        thisresplenp = &resplen;
                } else {
                        thisanssizp = anssizp2;
                        thisansp = ansp2;
                        thisresplenp = resplen2;
                }

                if (*thisanssizp < MAXPACKET
                    /* If the current buffer is not the static
                       user-supplied buffer then we can reallocate
                       it.  */
                    && (thisansp != NULL && thisansp != ansp)
#ifdef FIONREAD
                    /* Is the size too small?  */
                    && (ioctl (pfd[0].fd, FIONREAD, thisresplenp) < 0
                        || *thisanssizp < *thisresplenp)
#endif
                    ) {
                        /* Always allocate MAXPACKET, callers expect
                           this specific size.  */
                        u_char *newp = malloc (MAXPACKET);
                        /* If malloc fails the existing buffer and size
                           are kept and the datagram is read into
                           them.  */
                        if (newp != NULL) {
                                *thisanssizp = MAXPACKET;
                                *thisansp = newp;
                                if (thisansp == ansp2)
                                  *ansp2_malloced = 1;
                        }
                }
                /* We could end up with truncation if anscp was NULL
                   (not allowed to change caller's buffer) and the
                   response buffer size is too small.  This isn't a
                   reliable way to detect truncation because the ioctl
                   may be an inaccurate report of the UDP message size.
                   Therefore we use this only to issue debug output.
                   To do truncation accurately with UDP we need
                   MSG_TRUNC which is only available on Linux.  We
                   can abstract out the Linux-specific feature in the
                   future to detect truncation.  */
                HEADER *anhp = (HEADER *) *thisansp;
                socklen_t fromlen = sizeof(struct sockaddr_in6);
                assert (sizeof(from) <= fromlen);
                *thisresplenp = recvfrom(pfd[0].fd, (char*)*thisansp,
                                         *thisanssizp, 0,
                                        (struct sockaddr *)&from, &fromlen);
                if (__glibc_unlikely (*thisresplenp <= 0))       {
                        /* Nothing was read.  EINTR and EAGAIN lead
                           back to polling with a recomputed timeout;
                           any other outcome ends the exchange.  */
                        if (errno == EINTR || errno == EAGAIN) {
                                need_recompute = 1;
                                goto wait;
                        }
                        return close_and_return_error (statp, resplen2);
                }
                *gotsomewhere = 1;
                if (__glibc_unlikely (*thisresplenp < HFIXEDSZ))       {
                        /*
                         * Undersized message.
                         */
                        *terrno = EMSGSIZE;
                        return close_and_return_error (statp, resplen2);
                }
                /* The id must match a query whose reply is still
                   outstanding.  */
                if ((recvresp1 || hp->id != anhp->id)
                    && (recvresp2 || hp2->id != anhp->id)) {
                        /*
                         * response from old query, ignore it.
                         * XXX - potential security hazard could
                         *       be detected here.
                         */
                        goto wait;
                }

                /* Paranoia check.  Due to the connected UDP socket,
                   the kernel has already filtered invalid addresses
                   for us.  */
                if (!res_ourserver_p(statp, &from))
                  goto wait;

                /* Check for the correct header layout and a matching
                   question.  */
                if ((recvresp1 || !res_queriesmatch(buf, buf + buflen,
                                                       *thisansp,
                                                       *thisansp
                                                       + *thisanssizp))
                    && (recvresp2 || !res_queriesmatch(buf2, buf2 + buflen2,
                                                       *thisansp,
                                                       *thisansp
                                                       + *thisanssizp)))
                  goto wait;

                if (anhp->rcode == SERVFAIL ||
                    anhp->rcode == NOTIMP ||
                    anhp->rcode == REFUSED) {
                        /* Also entered via goto from the "empty
                           NOERROR" check further down.  */
                next_ns:
                        /* Another reply has already been accepted:
                           return it and report no second answer.  */
                        if (recvresp1 || (buf2 != NULL && recvresp2)) {
                          *resplen2 = 0;
                          return resplen;
                        }
                        if (buf2 != NULL)
                          {
                            /* No data from the first reply.  */
                            resplen = 0;
                            /* We are waiting for a possible second reply.  */
                            if (hp->id == anhp->id)
                              recvresp1 = 1;
                            else
                              recvresp2 = 1;

                            goto wait;
                          }

                        /* don't retry if called from dig */
                        if (!statp->pfcode)
                          return close_and_return_error (statp, resplen2);
                        /* With pfcode set, __res_iclose is called and
                           processing of this answer continues
                           below.  */
                        __res_iclose(statp, false);
                }
                /* A NOERROR reply with no answer records, the aa and
                   ra bits clear and no additional records is handled
                   like the failure codes above.  */
                if (anhp->rcode == NOERROR && anhp->ancount == 0
                    && anhp->aa == 0 && anhp->ra == 0 && anhp->arcount == 0) {
                        goto next_ns;
                }
                if (!(statp->options & RES_IGNTC) && anhp->tc) {
                        /*
                         * To get the rest of answer,
                         * use TCP with same server.
                         */
                        *v_circuit = 1;
                        __res_iclose(statp, false);
                        // XXX if we have received one reply we could
                        // XXX use it and not repeat it over TCP...
                        if (resplen2 != NULL)
                          *resplen2 = 0;
                        return (1);
                }
                /* Mark which reply we received.  */
                if (recvresp1 == 0 && hp->id == anhp->id)
                        recvresp1 = 1;
                else
                        recvresp2 = 1;
                /* Repeat waiting if we have a second answer to arrive.  */
                if ((recvresp1 & recvresp2) == 0) {
                        /* In single-request mode go back to waiting
                           for writability so that the next query can
                           be sent; in reopen mode the socket is
                           replaced first.  */
                        if (single_request) {
                                pfd[0].events = POLLOUT;
                                if (single_request_reopen) {
                                        __res_iclose (statp, false);
                                        retval = reopen (statp, terrno, ns);
                                        if (retval <= 0)
                                          {
                                            if (resplen2 != NULL)
                                              *resplen2 = 0;
                                            return retval;
                                          }
                                        pfd[0].fd = EXT(statp).nssocks[ns];
                                }
                        }
                        goto wait;
                }
                /* All is well.  We have received both responses (if
                   two responses were requested).  */
                return (resplen);
        } else if (pfd[0].revents & (POLLERR | POLLHUP | POLLNVAL))
          /* Something went wrong.  We can stop trying.  */
          return close_and_return_error (statp, resplen2);
        else {
                /* poll should not have returned > 0 in this case.  */
                abort ();
        }
}
1415
/* Return 1 if the socket addresses A1 and A2 have the same port and
   the same address, 0 otherwise.  Although both parameters are typed
   as struct sockaddr_in6, either may really hold a struct sockaddr_in;
   the family field says which.  An AF_INET address compares equal to
   its IPv4-mapped IPv6 form.  Only AF_INET and AF_INET6 are
   expected.  */
static int
sock_eq(struct sockaddr_in6 *a1, struct sockaddr_in6 *a2) {
        if (a1->sin6_family != a2->sin6_family) {
                /* Mixed families.  If the first argument is the IPv4
                   one, swap the roles; otherwise the first argument is
                   taken to be IPv6 and the second IPv4.  */
                struct sockaddr_in6 *v6 = a1;
                struct sockaddr_in *v4 = (struct sockaddr_in *) a2;

                if (a1->sin6_family == AF_INET) {
                        v6 = a2;
                        v4 = (struct sockaddr_in *) a1;
                }

                if (v6->sin6_port != v4->sin_port)
                        return 0;
                if (!IN6_IS_ADDR_V4MAPPED(&v6->sin6_addr))
                        return 0;
                /* The last four bytes of a mapped address carry the
                   IPv4 address in network byte order.  */
                return memcmp(&v6->sin6_addr.s6_addr[12],
                              &v4->sin_addr.s_addr,
                              sizeof v4->sin_addr.s_addr) == 0;
        }

        if (a1->sin6_family == AF_INET) {
                /* Both are IPv4.  */
                struct sockaddr_in *lhs = (struct sockaddr_in *) a1;
                struct sockaddr_in *rhs = (struct sockaddr_in *) a2;

                if (lhs->sin_port != rhs->sin_port)
                        return 0;
                return lhs->sin_addr.s_addr == rhs->sin_addr.s_addr;
        }

        /* Same family and not IPv4: compare as IPv6.  */
        if (a1->sin6_port != a2->sin6_port)
                return 0;
        return memcmp(&a1->sin6_addr, &a2->sin6_addr,
                      sizeof (struct in6_addr)) == 0;
}