/* $OpenBSD: res_send.c,v 1.21 2008/05/11 05:03:03 brad Exp $ */ /* * ++Copyright++ 1985, 1989, 1993 * - * Copyright (c) 1985, 1989, 1993 * The Regents of the University of California. All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * 3. Neither the name of the University nor the names of its contributors * may be used to endorse or promote products derived from this software * without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF * SUCH DAMAGE. * - * Portions Copyright (c) 1993 by Digital Equipment Corporation. * * Permission to use, copy, modify, and distribute this software for any * purpose with or without fee is hereby granted, provided that the above * copyright notice and this permission notice appear in all copies, and that * the name of Digital Equipment Corporation not be used in advertising or * publicity pertaining to distribution of the document or software without * specific, written prior permission. * * THE SOFTWARE IS PROVIDED "AS IS" AND DIGITAL EQUIPMENT CORP. DISCLAIMS ALL * WARRANTIES WITH REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES * OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL DIGITAL EQUIPMENT * CORPORATION BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS * ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS * SOFTWARE. * - * --Copyright-- */ #ifndef INET6 #define INET6 #endif /* change this to "0" * if you talk to a lot * of multi-homed SunOS * ("broken") name servers. */ #define CHECK_SRVR_ADDR 1 /* XXX - should be in options.h */ /* * Send query to name server and wait for reply. */ #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include "thread_private.h" static int s = -1; /* socket used for communications */ static int connected = 0; /* is the socket connected */ static int vc = 0; /* is the socket a virtual ciruit? */ static int af = 0; /* address family of socket */ #define CAN_RECONNECT 1 #ifndef DEBUG # define Dprint(cond, args) /*empty*/ # define DprintQ(cond, args, query, size) /*empty*/ # define Aerror(file, string, error, address) /*empty*/ # define Perror(file, string, error) /*empty*/ #else # define Dprint(cond, args) if (cond) {fprintf args;} else {} # define DprintQ(cond, args, query, size) if (cond) {\ fprintf args;\ __fp_nquery(query, size, stdout);\ } else {} static char abuf[NI_MAXHOST]; static char pbuf[NI_MAXSERV]; static void Aerror(FILE *, char *, int, struct sockaddr *); static void Perror(FILE *, char *, int); static void Aerror(FILE *file, char *string, int error, struct sockaddr *address) { struct __res_state *_resp = _THREAD_PRIVATE(_res, _res, &_res); int save = errno; if (_resp->options & RES_DEBUG) { if (getnameinfo(address, address->sa_len, abuf, sizeof(abuf), pbuf, sizeof(pbuf), NI_NUMERICHOST | NI_NUMERICSERV) != 0) { strlcpy(abuf, "?", sizeof(abuf)); strlcpy(pbuf, "?", sizeof(pbuf)); } fprintf(file, "res_send: %s ([%s].%s): %s\n", string, abuf, pbuf, strerror(error)); } errno = save; } static void Perror(FILE *file, char *string, int error) { struct __res_state *_resp = _THREAD_PRIVATE(_res, _res, &_res); int save = errno; if (_resp->options & RES_DEBUG) { fprintf(file, "res_send: %s: %s\n", string, strerror(error)); } errno = save; } #endif static res_send_qhook Qhook = NULL; static res_send_rhook Rhook = NULL; void res_send_setqhook(res_send_qhook hook) { Qhook = hook; } void res_send_setrhook(res_send_rhook hook) { Rhook = hook; } #ifdef INET6 static struct sockaddr * get_nsaddr(size_t); /* * pick appropriate nsaddr_list for use. see res_init() for initialization. */ static struct sockaddr * get_nsaddr(size_t n) { struct __res_state *_resp = _THREAD_PRIVATE(_res, _res, &_res); struct __res_state_ext *_res_extp = _THREAD_PRIVATE(_res_ext, _res_ext, &_res_ext); if (!_resp->nsaddr_list[n].sin_family) { /* * - _res_extp->nsaddr_list[n] holds an address that is larger * than struct sockaddr, and * - user code did not update _resp->nsaddr_list[n]. */ return (struct sockaddr *)&_res_extp->nsaddr_list[n]; } else { /* * - user code updated _res.nsaddr_list[n], or * - _resp->nsaddr_list[n] has the same content as * _res_extp->nsaddr_list[n]. */ return (struct sockaddr *)&_resp->nsaddr_list[n]; } } #else #define get_nsaddr(n) ((struct sockaddr *)&_resp->nsaddr_list[(n)]) #endif /* int * res_isourserver(ina) * looks up "ina" in _resp->ns_addr_list[] * returns: * 0 : not found * >0 : found * author: * paul vixie, 29may94 */ int res_isourserver(const struct sockaddr_in *inp) { struct __res_state *_resp = _THREAD_PRIVATE(_res, _res, &_res); #ifdef INET6 const struct sockaddr_in6 *in6p = (const struct sockaddr_in6 *)inp; const struct sockaddr_in6 *srv6; #endif const struct sockaddr_in *srv; int ns, ret; ret = 0; switch (inp->sin_family) { #ifdef INET6 case AF_INET6: for (ns = 0; ns < _resp->nscount; ns++) { srv6 = (struct sockaddr_in6 *)get_nsaddr(ns); if (srv6->sin6_family == in6p->sin6_family && srv6->sin6_port == in6p->sin6_port && srv6->sin6_scope_id == in6p->sin6_scope_id && (IN6_IS_ADDR_UNSPECIFIED(&srv6->sin6_addr) || IN6_ARE_ADDR_EQUAL(&srv6->sin6_addr, &in6p->sin6_addr))) { ret++; break; } } break; #endif case AF_INET: for (ns = 0; ns < _resp->nscount; ns++) { srv = (struct sockaddr_in *)get_nsaddr(ns); if (srv->sin_family == inp->sin_family && srv->sin_port == inp->sin_port && (srv->sin_addr.s_addr == INADDR_ANY || srv->sin_addr.s_addr == inp->sin_addr.s_addr)) { ret++; break; } } break; } return (ret); } /* int * res_nameinquery(name, type, class, buf, eom) * look for (name,type,class) in the query section of packet (buf,eom) * returns: * -1 : format error * 0 : not found * >0 : found * author: * paul vixie, 29may94 */ int res_nameinquery(const char *name, int type, int class, const u_char *buf, const u_char *eom) { const u_char *cp = buf + HFIXEDSZ; int qdcount = ntohs(((HEADER*)buf)->qdcount); while (qdcount-- > 0) { char tname[MAXDNAME+1]; int n, ttype, tclass; n = dn_expand(buf, eom, cp, tname, sizeof tname); if (n < 0) return (-1); cp += n; ttype = _getshort(cp); cp += INT16SZ; tclass = _getshort(cp); cp += INT16SZ; if (ttype == type && tclass == class && strcasecmp(tname, name) == 0) return (1); } return (0); } /* int * res_queriesmatch(buf1, eom1, buf2, eom2) * is there a 1:1 mapping of (name,type,class) * in (buf1,eom1) and (buf2,eom2)? * returns: * -1 : format error * 0 : not a 1:1 mapping * >0 : is a 1:1 mapping * author: * paul vixie, 29may94 */ int res_queriesmatch(const u_char *buf1, const u_char *eom1, const u_char *buf2, const u_char *eom2) { const u_char *cp = buf1 + HFIXEDSZ; int qdcount = ntohs(((HEADER*)buf1)->qdcount); if (qdcount != ntohs(((HEADER*)buf2)->qdcount)) return (0); while (qdcount-- > 0) { char tname[MAXDNAME+1]; int n, ttype, tclass; n = dn_expand(buf1, eom1, cp, tname, sizeof tname); if (n < 0) return (-1); cp += n; ttype = _getshort(cp); cp += INT16SZ; tclass = _getshort(cp); cp += INT16SZ; if (!res_nameinquery(tname, ttype, tclass, buf2, eom2)) return (0); } return (1); } int res_send(const u_char *buf, int buflen, u_char *ans, int anssiz) { struct __res_state *_resp = _THREAD_PRIVATE(_res, _res, &_res); HEADER *hp = (HEADER *) buf; HEADER *anhp = (HEADER *) ans; int gotsomewhere, connreset, terrno, try, v_circuit, resplen, ns; int n; u_int badns; /* XXX NSMAX can't exceed #/bits in this var */ if (_res_init(0) == -1) { /* errno should have been set by res_init() in this case. */ return (-1); } DprintQ((_resp->options & RES_DEBUG) || (_resp->pfcode & RES_PRF_QUERY), (stdout, ";; res_send()\n"), buf, buflen); v_circuit = (_resp->options & RES_USEVC) || buflen > PACKETSZ; gotsomewhere = 0; connreset = 0; terrno = ETIMEDOUT; badns = 0; /* * Send request, RETRY times, or until successful */ for (try = 0; try < _resp->retry; try++) { for (ns = 0; ns < _resp->nscount; ns++) { struct sockaddr *nsap = get_nsaddr(ns); socklen_t salen; if (nsap->sa_len) salen = nsap->sa_len; #ifdef INET6 else if (nsap->sa_family == AF_INET6) salen = sizeof(struct sockaddr_in6); #endif else if (nsap->sa_family == AF_INET) salen = sizeof(struct sockaddr_in); else salen = 0; /*unknown, die on connect*/ same_ns: if (badns & (1 << ns)) { res_close(); goto next_ns; } if (Qhook) { int done = 0, loops = 0; do { res_sendhookact act; act = (*Qhook)((struct sockaddr_in **)&nsap, &buf, &buflen, ans, anssiz, &resplen); switch (act) { case res_goahead: done = 1; break; case res_nextns: res_close(); goto next_ns; case res_done: return (resplen); case res_modified: /* give the hook another try */ if (++loops < 42) /*doug adams*/ break; /*FALLTHROUGH*/ case res_error: /*FALLTHROUGH*/ default: return (-1); } } while (!done); } Dprint((_resp->options & RES_DEBUG) && getnameinfo(nsap, salen, abuf, sizeof(abuf), NULL, 0, NI_NUMERICHOST) == 0, (stdout, ";; Querying server (# %d) address = %s\n", ns + 1, abuf)); if (v_circuit) { int truncated; struct iovec iov[2]; u_short len; u_char *cp; /* * Use virtual circuit; * at most one attempt per server. */ try = _resp->retry; truncated = 0; if ((s < 0) || (!vc) || (af != nsap->sa_family)) { if (s >= 0) res_close(); af = nsap->sa_family; s = socket(af, SOCK_STREAM, 0); if (s < 0) { terrno = errno; Perror(stderr, "socket(vc)", errno); #if 0 return (-1); #else badns |= (1 << ns); res_close(); goto next_ns; #endif } errno = 0; if (connect(s, nsap, salen) < 0) { terrno = errno; Aerror(stderr, "connect/vc", errno, nsap); badns |= (1 << ns); res_close(); goto next_ns; } vc = 1; } /* * Send length & message */ putshort((u_short)buflen, (u_char*)&len); iov[0].iov_base = (caddr_t)&len; iov[0].iov_len = INT16SZ; iov[1].iov_base = (caddr_t)buf; iov[1].iov_len = buflen; if (writev(s, iov, 2) != (INT16SZ + buflen)) { terrno = errno; Perror(stderr, "write failed", errno); badns |= (1 << ns); res_close(); goto next_ns; } /* * Receive length & response */ read_len: cp = ans; len = INT16SZ; while ((n = read(s, (char *)cp, (int)len)) > 0) { cp += n; if ((len -= n) <= 0) break; } if (n <= 0) { terrno = errno; Perror(stderr, "read failed", errno); res_close(); /* * A long running process might get its TCP * connection reset if the remote server was * restarted. Requery the server instead of * trying a new one. When there is only one * server, this means that a query might work * instead of failing. We only allow one reset * per query to prevent looping. */ if (terrno == ECONNRESET && !connreset) { connreset = 1; res_close(); goto same_ns; } res_close(); goto next_ns; } resplen = _getshort(ans); if (resplen > anssiz) { Dprint(_resp->options & RES_DEBUG, (stdout, ";; response truncated\n") ); truncated = 1; len = anssiz; } else len = resplen; cp = ans; while (len != 0 && (n = read(s, (char *)cp, (int)len)) > 0) { cp += n; len -= n; } if (n <= 0) { terrno = errno; Perror(stderr, "read(vc)", errno); res_close(); goto next_ns; } if (truncated) { /* * Flush rest of answer * so connection stays in synch. */ anhp->tc = 1; len = resplen - anssiz; while (len != 0) { char junk[PACKETSZ]; n = (len > sizeof(junk) ? sizeof(junk) : len); if ((n = read(s, junk, n)) > 0) len -= n; else break; } } /* * The calling applicating has bailed out of * a previous call and failed to arrange to have * the circuit closed or the server has got * itself confused. Anyway drop the packet and * wait for the correct one. */ if (hp->id != anhp->id) { DprintQ((_resp->options & RES_DEBUG) || (_resp->pfcode & RES_PRF_REPLY), (stdout, ";; old answer (unexpected):\n"), ans, (resplen>anssiz)?anssiz:resplen); goto read_len; } } else { /* * Use datagrams. */ struct pollfd pfd; int timeout; struct sockaddr_storage from; socklen_t fromlen; if ((s < 0) || vc || (af != nsap->sa_family)) { if (vc) res_close(); af = nsap->sa_family; s = socket(af, SOCK_DGRAM, 0); if (s < 0) { #if !CAN_RECONNECT bad_dg_sock: #endif terrno = errno; Perror(stderr, "socket(dg)", errno); #if 0 return (-1); #else badns |= (1 << ns); res_close(); goto next_ns; #endif } #ifdef IPV6_MINMTU if (af == AF_INET6) { const int yes = 1; (void)setsockopt(s, IPPROTO_IPV6, IPV6_USE_MIN_MTU, &yes, sizeof(yes)); } #endif connected = 0; } /* * On a 4.3BSD+ machine (client and server, * actually), sending to a nameserver datagram * port with no nameserver will cause an * ICMP port unreachable message to be returned. * If our datagram socket is "connected" to the * server, we get an ECONNREFUSED error on the next * socket operation, and poll returns if the * error message is received. We can thus detect * the absence of a nameserver without timing out. * If we have sent queries to at least two servers, * however, we don't want to remain connected, * as we wish to receive answers from the first * server to respond. */ if (!(_resp->options & RES_INSECURE1) && (_resp->nscount == 1 || (try == 0 && ns == 0))) { /* * Connect only if we are sure we won't * receive a response from another server. */ if (!connected) { if (connect(s, nsap, salen) < 0) { Aerror(stderr, "connect(dg)", errno, nsap); badns |= (1 << ns); res_close(); goto next_ns; } connected = 1; } if (send(s, (char*)buf, buflen, 0) != buflen) { Perror(stderr, "send", errno); badns |= (1 << ns); res_close(); goto next_ns; } } else { /* * Disconnect if we want to listen * for responses from more than one server. */ if (connected) { #if CAN_RECONNECT #ifdef INET6 /* XXX: any errornous address */ #endif /* INET6 */ struct sockaddr_in no_addr; no_addr.sin_family = AF_INET; no_addr.sin_addr.s_addr = INADDR_ANY; no_addr.sin_port = 0; (void) connect(s, (struct sockaddr *) &no_addr, sizeof(no_addr)); #else int s1 = socket(af, SOCK_DGRAM,0); if (s1 < 0) goto bad_dg_sock; (void) dup2(s1, s); (void) close(s1); Dprint(_resp->options & RES_DEBUG, (stdout, ";; new DG socket\n")) #endif #ifdef IPV6_MINMTU if (af == AF_INET6) { const int yes = 1; (void)setsockopt(s, IPPROTO_IPV6, IPV6_USE_MIN_MTU, &yes, sizeof(yes)); } #endif connected = 0; errno = 0; } if (sendto(s, (char*)buf, buflen, 0, nsap, salen) != buflen) { Aerror(stderr, "sendto", errno, nsap); badns |= (1 << ns); res_close(); goto next_ns; } } /* * Wait for reply */ timeout = 1000 * (_resp->retrans << try); if (try > 0) timeout /= _resp->nscount; if (timeout < 1000) timeout = 1000; wait: pfd.fd = s; pfd.events = POLLIN; n = poll(&pfd, 1, timeout); if (n < 0) { if (errno == EINTR) goto wait; Perror(stderr, "poll", errno); res_close(); goto next_ns; } if (n == 0) { /* * timeout */ Dprint(_resp->options & RES_DEBUG, (stdout, ";; timeout\n")); gotsomewhere = 1; res_close(); goto next_ns; } errno = 0; fromlen = sizeof(from); resplen = recvfrom(s, (char*)ans, anssiz, 0, (struct sockaddr *)&from, &fromlen); if (resplen <= 0) { Perror(stderr, "recvfrom", errno); res_close(); goto next_ns; } gotsomewhere = 1; if (hp->id != anhp->id) { /* * response from old query, ignore it. * XXX - potential security hazard could * be detected here. */ DprintQ((_resp->options & RES_DEBUG) || (_resp->pfcode & RES_PRF_REPLY), (stdout, ";; old answer:\n"), ans, (resplen>anssiz)?anssiz:resplen); goto wait; } #if CHECK_SRVR_ADDR if (!(_resp->options & RES_INSECURE1) && !res_isourserver((struct sockaddr_in *)&from)) { /* * response from wrong server? ignore it. * XXX - potential security hazard could * be detected here. */ DprintQ((_resp->options & RES_DEBUG) || (_resp->pfcode & RES_PRF_REPLY), (stdout, ";; not our server:\n"), ans, (resplen>anssiz)?anssiz:resplen); goto wait; } #endif if (!(_resp->options & RES_INSECURE2) && !res_queriesmatch(buf, buf + buflen, ans, ans + anssiz)) { /* * response contains wrong query? ignore it. * XXX - potential security hazard could * be detected here. */ DprintQ((_resp->options & RES_DEBUG) || (_resp->pfcode & RES_PRF_REPLY), (stdout, ";; wrong query name:\n"), ans, (resplen>anssiz)?anssiz:resplen); goto wait; } if (anhp->rcode == SERVFAIL || anhp->rcode == NOTIMP || anhp->rcode == REFUSED) { DprintQ(_resp->options & RES_DEBUG, (stdout, "server rejected query:\n"), ans, (resplen>anssiz)?anssiz:resplen); badns |= (1 << ns); res_close(); /* don't retry if called from dig */ if (!_resp->pfcode) goto next_ns; } if (!(_resp->options & RES_IGNTC) && anhp->tc) { /* * get rest of answer; * use TCP with same server. */ Dprint(_resp->options & RES_DEBUG, (stdout, ";; truncated answer\n")); v_circuit = 1; res_close(); goto same_ns; } } /*if vc/dg*/ Dprint((_resp->options & RES_DEBUG) || ((_resp->pfcode & RES_PRF_REPLY) && (_resp->pfcode & RES_PRF_HEAD1)), (stdout, ";; got answer:\n")); DprintQ((_resp->options & RES_DEBUG) || (_resp->pfcode & RES_PRF_REPLY), (stdout, "%s", ""), ans, (resplen>anssiz)?anssiz:resplen); /* * If using virtual circuits, we assume that the first server * is preferred over the rest (i.e. it is on the local * machine) and only keep that one open. * If we have temporarily opened a virtual circuit, * or if we haven't been asked to keep a socket open, * close the socket. */ if ((v_circuit && (!(_resp->options & RES_USEVC) || ns != 0)) || !(_resp->options & RES_STAYOPEN)) { res_close(); } if (Rhook) { int done = 0, loops = 0; do { res_sendhookact act; act = (*Rhook)((struct sockaddr_in *)nsap, buf, buflen, ans, anssiz, &resplen); switch (act) { case res_goahead: case res_done: done = 1; break; case res_nextns: res_close(); goto next_ns; case res_modified: /* give the hook another try */ if (++loops < 42) /*doug adams*/ break; /*FALLTHROUGH*/ case res_error: /*FALLTHROUGH*/ default: return (-1); } } while (!done); } return (resplen); next_ns: ; } /*foreach ns*/ } /*foreach retry*/ res_close(); if (!v_circuit) { if (!gotsomewhere) errno = ECONNREFUSED; /* no nameservers found */ else errno = ETIMEDOUT; /* no answer obtained */ } else errno = terrno; return (-1); } /* * This routine is for closing the socket if a virtual circuit is used and * the program wants to close it. This provides support for endhostent() * which expects to close the socket. * * This routine is not expected to be user visible. */ void res_close(void) { if (s >= 0) { (void) close(s); s = -1; connected = 0; vc = 0; af = 0; } }