#pragma ident "@(#)nfs_cast.c 1.26 05/06/08 SMI"
#include <stdio.h>
#include <syslog.h>
#include <errno.h>
#include <string.h>
#include <sys/types.h>
#include <sys/time.h>
#include <sys/resource.h>
#include <unistd.h>
#include <stdlib.h>
#include <oncrpc/rpc.h>
#include <oncrpc/pmap_prot.h>
#include <sys/socket.h>
#include <netdb.h>
#define NFSCLIENT
#include <locale.h>
#include "automount.h"
#define PENALTY_WEIGHT 100000
struct tstamps {
struct tstamps *ts_next;
int ts_penalty;
int ts_inx;
int ts_rcvd;
struct timeval ts_timeval;
};
struct addrs {
struct addrs *addr_next;
struct mapfs *addr_mfs;
struct hostent *addr_addrs;
struct tstamps *addr_if_tstamps;
};
struct transp {
struct transp *tr_next;
int tr_fd;
const char *tr_afname;
struct addrs *tr_addrs;
};
struct sm {
struct mapfs *mfs;
struct timeval timeval;
};
static void free_transports(struct transp *);
static void calc_resp_time(struct timeval *);
static struct mapfs *sort_responses(struct transp *);
static int host_sm(const void *, const void *b);
static int time_sm(const void *, const void *b);
extern struct mapfs *add_mfs(struct mapfs *, int, struct mapfs **,
struct mapfs **);
struct aftype {
int afnum;
char *name;
};
enum clnt_stat
nfs_cast(struct mapfs *mfs_in, struct mapfs **mfs_out, int timeout)
{
struct servent *portmap;
enum clnt_stat clnt_stat;
AUTH *sys_auth = authunix_create_default();
XDR xdr_stream;
register XDR *xdrs = &xdr_stream;
int outlen;
static const struct aftype aflist[] = {
{ AF_INET, "IPv4" },
#ifdef HAVE_IPV6_SUPPORT
{ AF_INET6, "IPv6" }
#endif
};
#define N_AFS (sizeof aflist / sizeof aflist[0])
int if_inx;
int tsec;
int sent, addr_cnt, rcvd;
fd_set readfds, mask;
register uint32_t xid;
register int i;
struct rpc_msg msg;
struct timeval t, rcv_timeout;
char outbuf[UDPMSGSIZE], inbuf[UDPMSGSIZE];
struct hostent *hp;
int error_num;
char **hostaddrs;
struct sockaddr_storage to_addr;
struct sockaddr *to;
struct sockaddr_storage from_addr;
socklen_t fromlen;
ssize_t len;
struct transp *tr_head;
struct transp *trans, *prev_trans;
struct addrs *a, *prev_addr;
struct tstamps *ts, *prev_ts;
size_t af_idx;
int af;
struct rlimit rl;
int dtbsize;
struct mapfs *mfs;
portmap = getservbyname("sunrpc", "udp");
addr_cnt = sent = rcvd = 0;
tr_head = NULL;
FD_ZERO(&mask);
dtbsize = FD_SETSIZE;
if (getrlimit(RLIMIT_NOFILE, &rl) == 0) {
if (rl.rlim_cur < FD_SETSIZE)
dtbsize = (int)rl.rlim_cur;
}
prev_trans = NULL;
prev_addr = NULL;
prev_ts = NULL;
for (mfs = mfs_in; mfs; mfs = mfs->mfs_next) {
if (trace > 2)
trace_prt(1, "nfs_cast: host=%s\n", mfs->mfs_host);
for (af_idx = 0; af_idx < N_AFS; af_idx++) {
af = aflist[af_idx].afnum;
trans = (struct transp *)malloc(sizeof (*trans));
if (trans == NULL) {
syslog(LOG_ERR, "no memory");
clnt_stat = RPC_CANTSEND;
goto done_broad;
}
(void) memset(trans, 0, sizeof (*trans));
if (tr_head == NULL)
tr_head = trans;
else
prev_trans->tr_next = trans;
prev_trans = trans;
trans->tr_fd = socket(af, SOCK_DGRAM, IPPROTO_UDP);
if (trans->tr_fd < 0) {
syslog(LOG_ERR, "nfscast: UDP %s socket: %m",
aflist[af_idx].name);
clnt_stat = RPC_CANTSEND;
goto done_broad;
}
trans->tr_afname = aflist[af_idx].name;
FD_SET(trans->tr_fd, &mask);
if_inx = 0;
hp = getipnodebyname(mfs->mfs_host, af, AI_DEFAULT, &error_num);
if (hp != NULL) {
if (mfs->mfs_ignore == 1)
mfs->mfs_ignore = 0;
a = (struct addrs *)malloc(sizeof (*a));
if (a == NULL) {
syslog(LOG_ERR, "no memory");
clnt_stat = RPC_CANTSEND;
freehostent(hp);
goto done_broad;
}
(void) memset(a, 0, sizeof (*a));
if (trans->tr_addrs == NULL)
trans->tr_addrs = a;
else
prev_addr->addr_next = a;
prev_addr = a;
a->addr_if_tstamps = NULL;
a->addr_mfs = mfs;
a->addr_addrs = hp;
hostaddrs = hp->h_addr_list;
while (*hostaddrs) {
ts = (struct tstamps *)
malloc(sizeof (*ts));
if (ts == NULL) {
syslog(LOG_ERR, "no memory");
clnt_stat = RPC_CANTSEND;
goto done_broad;
}
(void) memset(ts, 0, sizeof (*ts));
ts->ts_penalty = mfs->mfs_penalty;
if (a->addr_if_tstamps == NULL)
a->addr_if_tstamps = ts;
else
prev_ts->ts_next = ts;
prev_ts = ts;
ts->ts_inx = if_inx++;
addr_cnt++;
hostaddrs++;
}
break;
} else {
mfs->mfs_ignore = 1;
if (verbose)
syslog(LOG_ERR,
"%s:%s address not known",
mfs->mfs_host,
aflist[af_idx].name);
}
}
}
if (addr_cnt == 0) {
syslog(LOG_ERR, "nfscast: couldn't find addresses");
clnt_stat = RPC_CANTSEND;
goto done_broad;
}
(void) gettimeofday(&t, (struct timezone *)0);
xid = (uint32_t)(getpid() ^ t.tv_sec ^ t.tv_usec) & ~0xFF;
t.tv_usec = 0;
msg.rm_direction = CALL;
msg.rm_call.cb_rpcvers = RPC_MSG_VERSION;
msg.rm_call.cb_prog = PMAPPROG;
msg.rm_call.cb_vers = PMAPVERS;
msg.rm_call.cb_proc = NULLPROC;
if (sys_auth == (AUTH *)NULL) {
clnt_stat = RPC_SYSTEMERROR;
goto done_broad;
}
msg.rm_call.cb_cred = sys_auth->ah_cred;
msg.rm_call.cb_verf = sys_auth->ah_verf;
xdrmem_create(xdrs, (uint8_t *) outbuf, sizeof (outbuf), XDR_ENCODE);
if (! xdr_callmsg(xdrs, &msg)) {
clnt_stat = RPC_CANTENCODEARGS;
goto done_broad;
}
outlen = (int)xdr_getpos(xdrs);
xdr_destroy(xdrs);
for (tsec = 4; timeout > 0; tsec *= 2) {
timeout -= tsec;
if (timeout <= 0)
tsec += timeout;
rcv_timeout.tv_sec = tsec;
rcv_timeout.tv_usec = 0;
sent = 0;
for (trans = tr_head; trans; trans = trans->tr_next) {
for (a = trans->tr_addrs; a; a = a->addr_next) {
ts = a->addr_if_tstamps;
hp = a->addr_addrs;
hostaddrs = hp->h_addr_list;
while (*hostaddrs) {
*((uint32_t *)outbuf) =
htonl(xid + ts->ts_inx);
(void) gettimeofday(&(ts->ts_timeval),
(struct timezone *)0);
if (ts->ts_rcvd) {
sent++;
ts = ts->ts_next;
continue;
}
to = (struct sockaddr *)&to_addr;
to->sa_family = hp->h_addrtype;
if (to->sa_family == AF_INET) {
struct sockaddr_in *sin;
sin = (struct sockaddr_in *)to;
to->sa_len = sizeof(*sin);
sin->sin_port = portmap->s_port;
memcpy(&sin->sin_addr,
*hostaddrs++, hp->h_length);
} else {
struct sockaddr_in6 *sin6;
sin6 = (struct sockaddr_in6 *)to;
to->sa_len = sizeof(*sin6);
sin6->sin6_port = portmap->s_port;
memcpy(&sin6->sin6_addr,
*hostaddrs++, hp->h_length);
}
if (sendto(trans->tr_fd, outbuf,
outlen, 0, to, to->sa_len) != -1) {
sent++;
}
ts = ts->ts_next;
}
}
}
if (sent == 0) {
clnt_stat = RPC_CANTSEND;
goto done_broad;
}
rcvd = 0;
recv_again:
msg.acpted_rply.ar_verf = _null_auth;
msg.acpted_rply.ar_results.proc = (xdrproc_t)xdr_void;
readfds = mask;
switch (select(dtbsize, &readfds,
(fd_set *)NULL, (fd_set *)NULL, &rcv_timeout)) {
case 0:
if (rcvd > 0)
goto done_broad;
clnt_stat = RPC_TIMEDOUT;
continue;
case -1:
if (errno == EINTR)
goto recv_again;
syslog(LOG_ERR, "nfscast: select: %m");
if (rcvd == 0)
clnt_stat = RPC_CANTRECV;
goto done_broad;
}
for (trans = tr_head; trans; trans = trans->tr_next) {
if (FD_ISSET(trans->tr_fd, &readfds))
break;
}
if (trans == NULL)
goto recv_again;
try_again:
len = recvfrom(trans->tr_fd, inbuf, sizeof (inbuf), 0,
(struct sockaddr *)&from_addr, &fromlen);
if (len < 0) {
if (errno == EINTR)
goto try_again;
syslog(LOG_ERR, "nfscast: recvfrom: UDP %s:%m",
trans->tr_afname);
clnt_stat = RPC_CANTRECV;
continue;
}
if ((size_t)len < sizeof (uint32_t))
goto recv_again;
xdrmem_create(xdrs, (uint8_t *) inbuf, (uint_t)len, XDR_DECODE);
if (xdr_replymsg(xdrs, &msg)) {
if (msg.rm_reply.rp_stat == MSG_ACCEPTED &&
(msg.rm_xid & ~0xFF) == xid) {
struct addrs *curr_addr;
i = msg.rm_xid & 0xFF;
for (curr_addr = trans->tr_addrs; curr_addr;
curr_addr = curr_addr->addr_next) {
for (ts = curr_addr->addr_if_tstamps; ts;
ts = ts->ts_next)
if (ts->ts_inx == i && !ts->ts_rcvd) {
ts->ts_rcvd = 1;
calc_resp_time(&ts->ts_timeval);
clnt_stat = RPC_SUCCESS;
rcvd++;
break;
}
}
}
}
xdrs->x_op = XDR_FREE;
msg.acpted_rply.ar_results.proc = (xdrproc_t)xdr_void;
(void) xdr_replymsg(xdrs, &msg);
XDR_DESTROY(xdrs);
if (rcvd == sent)
goto done_broad;
else
goto recv_again;
}
if (!rcvd)
clnt_stat = RPC_TIMEDOUT;
done_broad:
if (rcvd) {
*mfs_out = sort_responses(tr_head);
clnt_stat = RPC_SUCCESS;
}
free_transports(tr_head);
AUTH_DESTROY(sys_auth);
return (clnt_stat);
}
static struct mapfs *
sort_responses(trans)
struct transp *trans;
{
struct transp *t;
struct addrs *a;
struct tstamps *ti;
int i, size = 0, allocsize = 10;
struct mapfs *p, *mfs_head = NULL, *mfs_tail = NULL;
struct sm *buffer;
buffer = (struct sm *)malloc(allocsize * sizeof (struct sm));
if (!buffer) {
syslog(LOG_ERR, "sort_responses: malloc error.\n");
return (NULL);
}
for (t = trans; t; t = t->tr_next) {
for (a = t->tr_addrs; a; a = a->addr_next) {
for (ti = a->addr_if_tstamps;
ti; ti = ti->ts_next) {
if (!ti->ts_rcvd)
continue;
ti->ts_timeval.tv_usec +=
(ti->ts_penalty * PENALTY_WEIGHT);
if (ti->ts_timeval.tv_usec >= 1000000) {
ti->ts_timeval.tv_sec +=
(ti->ts_timeval.tv_usec / 1000000);
ti->ts_timeval.tv_usec =
(ti->ts_timeval.tv_usec % 1000000);
}
if (size >= allocsize) {
allocsize += 10;
buffer = (struct sm *)realloc(buffer,
allocsize * sizeof (struct sm));
if (!buffer) {
syslog(LOG_ERR,
"sort_responses: malloc error.\n");
return (NULL);
}
}
buffer[size].timeval = ti->ts_timeval;
buffer[size].mfs = a->addr_mfs;
size++;
}
}
}
#ifdef DEBUG
if (trace > 3) {
trace_prt(1, " sort_responses: before host sort:\n");
for (i = 0; i < size; i++)
trace_prt(1, " %s %d.%d\n", buffer[i].mfs->mfs_host,
buffer[i].timeval.tv_sec, buffer[i].timeval.tv_usec);
trace_prt(0, "\n");
}
#endif
qsort((void *)buffer, size, sizeof (struct sm), host_sm);
for (i = 1; i < size; i++) {
#ifdef DEBUG
if (trace > 3) {
trace_prt(1, " sort_responses: comparing %s and %s\n",
buffer[i-1].mfs->mfs_host,
buffer[i].mfs->mfs_host);
}
#endif
if (strcmp(buffer[i-1].mfs->mfs_host,
buffer[i].mfs->mfs_host) == 0)
memcpy(&buffer[i].timeval, &buffer[i-1].timeval,
sizeof (struct timeval));
}
if (trace > 3)
trace_prt(0, "\n");
#ifdef DEBUG
if (trace > 3) {
trace_prt(1, " sort_responses: before time sort:\n");
for (i = 0; i < size; i++)
trace_prt(1, " %s %d.%d\n", buffer[i].mfs->mfs_host,
buffer[i].timeval.tv_sec, buffer[i].timeval.tv_usec);
trace_prt(0, "\n");
}
#endif
qsort((void *)buffer, size, sizeof (struct sm), time_sm);
#ifdef DEBUG
if (trace > 3) {
trace_prt(1, " sort_responses: after sort:\n");
for (i = 0; i < size; i++)
trace_prt(1, " %s %d.%d\n", buffer[i].mfs->mfs_host,
buffer[i].timeval.tv_sec, buffer[i].timeval.tv_usec);
trace_prt(0, "\n");
}
#endif
for (i = 0; i < size; i++) {
#ifdef DEBUG
if (trace > 3) {
trace_prt(1, " sort_responses: adding %s\n",
buffer[i].mfs->mfs_host);
}
#endif
p = add_mfs(buffer[i].mfs, 0, &mfs_head, &mfs_tail);
if (!p)
return (NULL);
}
free(buffer);
return (mfs_head);
}
static int host_sm(const void *a, const void *b)
{
return (strcmp(((struct sm *)a)->mfs->mfs_host,
((struct sm *)b)->mfs->mfs_host));
}
static int time_sm(const void *a, const void *b)
{
if (timercmp(&(((struct sm *)a)->timeval),
&(((struct sm *)b)->timeval), < ))
return (-1);
else if (timercmp(&(((struct sm *)a)->timeval),
&(((struct sm *)b)->timeval), > ))
return (1);
else
return (0);
}
static void
calc_resp_time(send_time)
struct timeval *send_time;
{
struct timeval time_now;
(void) gettimeofday(&time_now, (struct timezone *)0);
if (time_now.tv_usec < send_time->tv_usec) {
time_now.tv_sec--;
time_now.tv_usec += 1000000;
}
send_time->tv_sec = time_now.tv_sec - send_time->tv_sec;
send_time->tv_usec = time_now.tv_usec - send_time->tv_usec;
}
static void
free_transports(trans)
struct transp *trans;
{
struct transp *t, *tmpt = NULL;
struct addrs *a, *tmpa = NULL;
struct tstamps *ts, *tmpts = NULL;
for (t = trans; t; t = tmpt) {
if (t->tr_fd > 0)
(void) close(t->tr_fd);
for (a = t->tr_addrs; a; a = tmpa) {
for (ts = a->addr_if_tstamps; ts; ts = tmpts) {
tmpts = ts->ts_next;
free(ts);
}
freehostent(a->addr_addrs);
tmpa = a->addr_next;
free(a);
}
tmpt = t->tr_next;
free(t);
}
}