2 * Send NSM notify calls to all hosts listed in the sm directory (default /var/lib/nfs/sm)
4 * Copyright (C) 2004-2006 Olaf Kirch <okir@suse.de>
11 #include <sys/types.h>
12 #include <sys/socket.h>
15 #include <sys/param.h>
16 #include <sys/syslog.h>
17 #include <arpa/inet.h>
/*
 * On-disk locations and protocol constants.
 *
 * BASEDIR is either NFS_STATEDIR or the literal "/var/lib/nfs" (the
 * preprocessor condition selecting between the two is not visible here).
 * The state file, the "sm" directory and its ".bak" sibling are derived
 * from BASEDIR by string concatenation, and the _SM_*_PATH variables are
 * initialised to those defaults; main() may point them at freshly
 * allocated strings instead.
 *
 * NSM_PROG and NSM_PROGRAM are both defined as 100024.
 * MAXMSGSIZE is used below as the element count of uint32_t message
 * buffers, so it is a size in 32-bit words, not bytes.
 */
33 # define BASEDIR NFS_STATEDIR
35 # define BASEDIR "/var/lib/nfs"
39 #define DEFAULT_SM_STATE_PATH BASEDIR "/state"
40 #define DEFAULT_SM_DIR_PATH BASEDIR "/sm"
41 #define DEFAULT_SM_BAK_PATH DEFAULT_SM_DIR_PATH ".bak"
43 char *_SM_BASE_PATH = BASEDIR;
44 char *_SM_STATE_PATH = DEFAULT_SM_STATE_PATH;
45 char *_SM_DIR_PATH = DEFAULT_SM_DIR_PATH;
46 char *_SM_BAK_PATH = DEFAULT_SM_BAK_PATH;
48 #define NSM_PROG 100024
49 #define NSM_PROGRAM 100024
53 #define NSM_MAX_TIMEOUT 120 /* don't make this too big */
54 #define MAXMSGSIZE 256
/*
 * File-scope types, option variables and forward declarations.
 *
 * nsm_address is a sockaddr_storage; addr_get_port() and addr_set_port()
 * read and write the port through sockaddr_in / sockaddr_in6 casts.
 * Only the "next" member of struct nsm_host is visible in this excerpt.
 *
 * opt_max_retry defaults to 15 * 60 and is added to time(NULL) to form
 * the give-up deadline, i.e. it is a duration in seconds.
 * opt_update_state defaults to 1 and is passed to nsm_get_state().
 * "hosts" is the head of the host list and starts out empty.
 *
 * Note that find_host() and nsm_log() are declared without "static",
 * unlike the other helpers.
 */
56 typedef struct sockaddr_storage nsm_address;
59 struct nsm_host * next;
71 static char nsm_hostname[256];
72 static uint32_t nsm_state;
73 static int opt_debug = 0;
74 static int opt_quiet = 0;
75 static int opt_update_state = 1;
76 static unsigned int opt_max_retry = 15 * 60;
77 static char * opt_srcaddr = 0;
78 static uint16_t opt_srcport = 0;
79 static int log_syslog = 0;
81 static unsigned int nsm_get_state(int);
82 static void notify(void);
83 static int notify_host(int, struct nsm_host *);
84 static void recv_reply(int);
85 static void backup_hosts(const char *, const char *);
86 static void get_hosts(const char *);
87 static void insert_host(struct nsm_host *);
88 struct nsm_host * find_host(uint32_t);
89 static int addr_get_port(nsm_address *);
90 static void addr_set_port(nsm_address *, int);
91 static struct addrinfo *host_lookup(int, const char *);
92 void nsm_log(int fac, const char *fmt, ...);
93 static int record_pid(void);
94 static void drop_privs(void);
95 static void set_kernel_nsm_state(int state);
97 static struct nsm_host * hosts = NULL;
/*
 * Program entry point.
 *
 * Visible steps, in order:
 *  - Parse options with getopt() using the string "dm:np:v:qP:f". The
 *    case labels are not visible in this excerpt; going by the usage
 *    text, the retry limit (given in minutes, converted with * 60) is
 *    presumably -m, the source port -p and the state directory -P.
 *  - When a state directory is supplied, _SM_BASE_PATH becomes a
 *    strdup() of the argument and the state, sm and sm.bak paths are
 *    rebuilt beneath it in malloc()ed buffers sized for the suffix plus
 *    separator.
 *  - Only when the base path still equals BASEDIR is record_pid()
 *    consulted; a return of 0 with force == 0 and opt_update_state == 1
 *    is treated as "already run" (the action taken is not visible here).
 *  - nsm_hostname is taken from opt_srcaddr with strncpy() bounded to
 *    sizeof - 1 (the array is static, so it stays NUL-terminated), or
 *    else from gethostname().
 *  - Entries are moved from the sm directory to sm.bak and then loaded
 *    from sm.bak into the host list.
 *  - The NSM state is fetched (and possibly updated) and handed to the
 *    kernel via set_kernel_nsm_state().
 *  - The process announces it is backgrounding, opens syslog and calls
 *    daemon(0, 0).
 *  - Hosts still queued at the end are reported with
 *    "Unable to notify %s, giving up".
 */
100 main(int argc, char **argv)
105 while ((c = getopt(argc, argv, "dm:np:v:qP:f")) != -1) {
114 opt_max_retry = atoi(optarg) * 60;
117 opt_update_state = 0;
120 opt_srcport = atoi(optarg);
123 opt_srcaddr = optarg;
129 _SM_BASE_PATH = strdup(optarg);
130 _SM_STATE_PATH = malloc(strlen(optarg)+1+sizeof("state"));
131 _SM_DIR_PATH = malloc(strlen(optarg)+1+sizeof("sm"));
132 _SM_BAK_PATH = malloc(strlen(optarg)+1+sizeof("sm.bak"));
133 if (_SM_BASE_PATH == NULL ||
134 _SM_STATE_PATH == NULL ||
135 _SM_DIR_PATH == NULL ||
136 _SM_BAK_PATH == NULL) {
137 nsm_log(LOG_WARNING, "unable to allocate memory");
140 strcat(strcpy(_SM_STATE_PATH, _SM_BASE_PATH), "/state");
141 strcat(strcpy(_SM_DIR_PATH, _SM_BASE_PATH), "/sm");
142 strcat(strcpy(_SM_BAK_PATH, _SM_BASE_PATH), "/sm.bak");
151 usage: fprintf(stderr,
152 "Usage: sm-notify [-dfq] [-m max-retry-minutes] [-p srcport]\n"
153 " [-P /path/to/state/directory] [-v my_host_name]\n");
157 if (strcmp(_SM_BASE_PATH, BASEDIR) == 0) {
158 if (record_pid() == 0 && force == 0 && opt_update_state == 1)
159 /* already run, don't try again */
164 strncpy(nsm_hostname, opt_srcaddr, sizeof(nsm_hostname)-1);
166 if (gethostname(nsm_hostname, sizeof(nsm_hostname)) < 0) {
167 perror("gethostname");
171 backup_hosts(_SM_DIR_PATH, _SM_BAK_PATH);
172 get_hosts(_SM_BAK_PATH);
174 /* Get and update the NSM state. This will call sync() */
175 nsm_state = nsm_get_state(opt_update_state);
176 set_kernel_nsm_state(nsm_state);
180 printf("Backgrounding to notify hosts...\n");
182 openlog("sm-notify", LOG_PID, LOG_DAEMON);
185 if (daemon(0, 0) < 0) {
186 nsm_log(LOG_WARNING, "unable to background: %s",
201 while ((hp = hosts) != 0) {
204 "Unable to notify %s, giving up",
/*
 * NOTE(review): the function header for these lines is not visible in
 * this excerpt; they appear to be the body of notify() -- confirm.
 *
 * Socket setup: a non-blocking AF_INET datagram socket is created and
 * local_addr is zeroed and defaulted to AF_INET. If opt_srcaddr is set
 * it is resolved with host_lookup(AF_INET, ...) and copied into
 * local_addr. With an explicit source port the socket is bound with
 * bind(); otherwise bindresvport() picks a port and getservbyport() is
 * used to steer away from ports registered for "udp", bounded by
 * retry_cnt < 100.
 *
 * Send loop: failtime is time(NULL) + opt_max_retry. Hosts whose
 * send_next has been reached are taken from the head of the queue and
 * passed to notify_host(); the per-host timeout is doubled and capped
 * at NSM_MAX_TIMEOUT, and send_next is rescheduled relative to "now".
 * poll() is then used to wait on the socket.
 */
219 nsm_address local_addr;
225 sock = socket(AF_INET, SOCK_DGRAM, 0);
230 fcntl(sock, F_SETFL, O_NONBLOCK);
232 memset(&local_addr, 0, sizeof(local_addr));
233 local_addr.ss_family = AF_INET; /* Default to IPv4 */
235 /* Bind source IP if provided on command line */
237 struct addrinfo *ai = host_lookup(AF_INET, opt_srcaddr);
240 "Not a valid hostname or address: \"%s\"\n",
244 memcpy(&local_addr, ai->ai_addr, ai->ai_addrlen);
245 /* We know it's IPv4 at this point */
248 /* Use source port if provided on the command line,
249 * otherwise use bindresvport */
251 addr_set_port(&local_addr, opt_srcport);
252 if (bind(sock, (struct sockaddr *) &local_addr, sizeof(local_addr)) < 0) {
258 struct sockaddr_in *sin = (struct sockaddr_in *)&local_addr;
259 (void) bindresvport(sock, sin);
260 /* try to avoid known ports */
261 se = getservbyport(sin->sin_port, "udp");
262 if (se && retry_cnt < 100) {
270 failtime = time(NULL) + opt_max_retry;
276 time_t now = time(NULL);
277 unsigned int sent = 0;
281 if (failtime && now >= failtime)
284 while (hosts && ((wait = hosts->send_next - now) <= 0)) {
285 /* Never send more than 10 packets at once */
289 /* Remove queue head */
293 if (notify_host(sock, hp)){
301 /* Set the timeout for this call, using an
302 exponential timeout strategy */
304 if ((hp->timeout <<= 1) > NSM_MAX_TIMEOUT)
305 hp->timeout = NSM_MAX_TIMEOUT;
306 hp->send_next = now + wait;
314 nsm_log(LOG_DEBUG, "Host %s due in %ld seconds",
323 if (poll(&pfd, 1, wait) != 1)
/*
 * notify_host - build and transmit one datagram for a single host.
 *
 * sock: datagram socket to send on.
 * host: queue entry describing the peer.
 *
 * Visible behaviour:
 *  - A function-local static xid is seeded from getpid() + time(NULL)
 *    (the guarding condition is not visible in this excerpt).
 *  - host->ai is resolved on demand with host_lookup(AF_UNSPEC, name);
 *    a failed lookup is logged as "... doesn't seem to be a valid
 *    address, skipped".
 *  - The message is assembled as 32-bit words in a zeroed buffer of
 *    MAXMSGSIZE words, starting with host->xid in network byte order.
 *  - Once host->retries reaches 4 the first addrinfo entry is moved to
 *    the tail of the list, an address is copied into host->addr and its
 *    port is reset to 0.
 *  - If the destination port is 0 a portmap query is built: port 111,
 *    program 100000, asking for NSM_PROGRAM / NSM_VERSION over
 *    IPPROTO_UDP. Otherwise an SM_NOTIFY call carrying nsm_hostname and
 *    nsm_state is built.
 *  - The byte length is the word count shifted left by 2; a failing
 *    sendto() is logged with errno and its text.
 *
 * The return value is an int per the prototype; the return statements
 * are not visible here.
 */
331 * Send notification to a single host
334 notify_host(int sock, struct nsm_host *host)
336 static unsigned int xid = 0;
338 uint32_t msgbuf[MAXMSGSIZE], *p;
342 xid = getpid() + time(NULL);
346 if (host->ai == NULL) {
347 host->ai = host_lookup(AF_UNSPEC, host->name);
348 if (host->ai == NULL) {
350 "%s doesn't seem to be a valid address,"
351 " skipped", host->name);
356 memset(msgbuf, 0, sizeof(msgbuf));
358 *p++ = htonl(host->xid);
362 /* If we retransmitted 4 times, reset the port to force
363 * a new portmap lookup (in case statd was restarted).
364 * We also rotate through multiple IP addresses at this
367 if (host->retries >= 4) {
368 struct addrinfo *first = host->ai;
369 struct addrinfo **next = &host->ai;
371 /* remove the first entry from the list */
372 host->ai = first->ai_next;
373 first->ai_next = NULL;
374 /* find the end of the list */
375 next = &first->ai_next;
377 next = & (*next)->ai_next;
378 /* put first entry at end */
380 memcpy(&host->addr, first->ai_addr, first->ai_addrlen);
381 addr_set_port(&host->addr, 0);
386 if (addr_get_port(&dest) == 0) {
387 /* Build a PMAP packet */
388 nsm_log(LOG_DEBUG, "Sending portmap query to %s", host->name);
390 addr_set_port(&dest, 111);
391 *p++ = htonl(100000);
399 *p++ = htonl(NSM_PROGRAM);
400 *p++ = htonl(NSM_VERSION);
401 *p++ = htonl(IPPROTO_UDP);
404 /* Build an SM_NOTIFY packet */
405 nsm_log(LOG_DEBUG, "Sending SM_NOTIFY to %s", host->name);
407 *p++ = htonl(NSM_PROGRAM);
408 *p++ = htonl(NSM_VERSION);
409 *p++ = htonl(NSM_NOTIFY);
416 len = strlen(nsm_hostname);
418 memcpy(p, nsm_hostname, len);
420 *p++ = htonl(nsm_state);
422 len = (p - msgbuf) << 2;
424 if (sendto(sock, msgbuf, len, 0, (struct sockaddr *) &dest, sizeof(dest)) < 0)
425 nsm_log(LOG_WARNING, "Sending Reboot Notification to "
426 "'%s' failed: errno %d (%s)", host->name, errno, strerror(errno));
/*
 * NOTE(review): the signature is not visible in this excerpt; going by
 * the prototype this is recv_reply(int sock) -- confirm.
 *
 * Visible behaviour:
 *  - One datagram is read with recv() into a buffer of MAXMSGSIZE
 *    32-bit words; "end" marks the last whole word received.
 *  - The header must be a REPLY (1) that is ACCEPTED (0), with a NULL
 *    verifier and a SUCCESS (0) status.
 *  - The host entry is located with find_host(xid); NULL means no match.
 *  - If the stored port for that host is 0 the reply answers a portmap
 *    query: without a statd binding the timeout is set to
 *    NSM_MAX_TIMEOUT and send_next is pushed back by the same amount;
 *    otherwise the returned port is stored and the timeout is capped at
 *    NSM_MAX_TIMEOUT / 4.
 *  - Otherwise the reply acknowledges an SM_NOTIFY: success is logged
 *    and the host's addrinfo list is released with freeaddrinfo().
 *  - The "fail" label re-inserts the host into the list.
 */
432 * Receive reply from remote host
438 uint32_t msgbuf[MAXMSGSIZE], *p, *end;
442 res = recv(sock, msgbuf, sizeof(msgbuf), 0);
446 nsm_log(LOG_DEBUG, "Received packet...");
449 end = p + (res >> 2);
452 if (*p++ != htonl(1) /* must be REPLY */
453 || *p++ != htonl(0) /* must be ACCEPTED */
454 || *p++ != htonl(0) /* must be NULL verifier */
456 || *p++ != htonl(0)) /* must be SUCCESS */
459 /* Before we look at the data, find the host struct for
461 if ((hp = find_host(xid)) == NULL)
464 if (addr_get_port(&hp->addr) == 0) {
465 /* This was a portmap request */
472 hp->send_next = time(NULL);
474 /* No binding for statd. Delay the next
475 * portmap query for max timeout */
476 nsm_log(LOG_DEBUG, "No statd on %s", hp->name);
477 hp->timeout = NSM_MAX_TIMEOUT;
478 hp->send_next += NSM_MAX_TIMEOUT;
480 addr_set_port(&hp->addr, port);
481 if (hp->timeout >= NSM_MAX_TIMEOUT / 4)
482 hp->timeout = NSM_MAX_TIMEOUT / 4;
486 /* Successful NOTIFY call. Server returns void,
487 * so nothing we need to do here (except
488 * check that we didn't read past the end of the
492 nsm_log(LOG_DEBUG, "Host %s notified successfully", hp->name);
497 freeaddrinfo(hp->ai);
502 fail: /* Re-insert the host */
/*
 * backup_hosts - move every entry of one directory into another.
 *
 * dirname: directory to scan.
 * bakname: directory the entries are renamed into.
 *
 * Entries whose name starts with '.' are skipped. Source and destination
 * paths are formatted with snprintf() into 1024-byte buffers (longer
 * paths are truncated by snprintf), and each entry is moved with
 * rename(); a failing rename is logged as "Failed to rename %s -> %s".
 */
507 * Back up all hosts from the sm directory to sm.bak
510 backup_hosts(const char *dirname, const char *bakname)
515 if (!(dir = opendir(dirname))) {
520 while ((de = readdir(dir)) != NULL) {
521 char src[1024], dst[1024];
523 if (de->d_name[0] == '.')
526 snprintf(src, sizeof(src), "%s/%s", dirname, de->d_name);
527 snprintf(dst, sizeof(dst), "%s/%s", bakname, de->d_name);
528 if (rename(src, dst) < 0) {
530 "Failed to rename %s -> %s: %m",
/*
 * get_hosts - turn each directory entry into a struct nsm_host.
 *
 * dirname: directory to scan (main() passes the sm.bak path).
 *
 * Entries starting with '.' are skipped. For each remaining entry a
 * zeroed host record is allocated with calloc(), the entry is stat()ed,
 * and the record is filled in: last_used from the file's mtime, timeout
 * from NSM_TIMEOUT, path and name as strdup() copies, and retries set to
 * 100 so that the first send takes the "retries >= 4" address-refresh
 * path in notify_host().
 *
 * NOTE(review): no check of the calloc()/strdup() results is visible in
 * this excerpt -- confirm against the full source.
 */
538 * Get all entries from sm.bak and convert them to host entries
541 get_hosts(const char *dirname)
543 struct nsm_host *host;
547 if (!(dir = opendir(dirname))) {
553 while ((de = readdir(dir)) != NULL) {
557 if (de->d_name[0] == '.')
560 host = calloc(1, sizeof(*host));
562 snprintf(path, sizeof(path), "%s/%s", dirname, de->d_name);
563 if (stat(path, &stb) < 0)
566 host->last_used = stb.st_mtime;
567 host->timeout = NSM_TIMEOUT;
568 host->path = strdup(path);
569 host->name = strdup(de->d_name);
570 host->retries = 100; /* force address retry */
/*
 * insert_host - link a host into the list at its sorted position.
 *
 * host: entry to insert; its send_next and last_used fields determine
 *       where it goes.
 *
 * The list is walked through a pointer-to-link ("where"). The ordering
 * key is send_next, ascending; among entries with equal send_next the
 * one with the larger last_used is placed first.
 */
582 * Insert host into sorted list
585 insert_host(struct nsm_host *host)
587 struct nsm_host **where, *p;
590 while ((p = *where) != 0) {
591 /* Sort in ascending order of send_next (next transmit time) */
592 if (host->send_next < p->send_next)
594 /* If we have the same timeout, put the
595 * most recently used host first.
596 * This makes sure that "recent" hosts
597 * get notified first.
599 if (host->send_next == p->send_next
600 && host->last_used > p->last_used)
/*
 * find_host - look up a host list entry by RPC transaction id.
 *
 * xid: transaction id to search for.
 *
 * Returns a struct nsm_host pointer; recv_reply() treats NULL as "no
 * matching host". The list is walked through a pointer-to-link.
 * NOTE(review): the comparison and what happens to a matching entry are
 * not visible in this excerpt.
 */
610 * Find host given the XID
613 find_host(uint32_t xid)
615 struct nsm_host **where, *p;
618 while ((p = *where) != 0) {
/*
 * nsm_get_state - read the NSM state number from the state file and,
 * optionally, write a new value back.
 *
 * update: main() passes opt_update_state here; how it gates the rewrite
 *         is not visible in this excerpt.
 *
 * The state file (_SM_STATE_PATH) is opened read-only. If it cannot be
 * opened, or does not contain exactly sizeof(state) bytes, a warning is
 * logged saying the state is being set to 1. The rewrite goes to
 * "<state path>.new" (opened O_CREAT|O_WRONLY, mode 0644) and is then
 * rename()d over the real state file, so the replacement is a single
 * rename rather than an in-place overwrite.
 *
 * Note that a failed rename() is logged with the text "Cannot create".
 */
630 * Retrieve the current NSM state
633 nsm_get_state(int update)
635 char newfile[PATH_MAX];
638 if ((fd = open(_SM_STATE_PATH, O_RDONLY)) < 0) {
640 nsm_log(LOG_WARNING, "%s: %m", _SM_STATE_PATH);
641 nsm_log(LOG_WARNING, "Creating %s, set initial state 1",
647 if (read(fd, &state, sizeof(state)) != sizeof(state)) {
649 "%s: bad file size, setting state = 1",
662 snprintf(newfile, sizeof(newfile),
663 "%s.new", _SM_STATE_PATH);
664 if ((fd = open(newfile, O_CREAT|O_WRONLY, 0644)) < 0) {
665 nsm_log(LOG_WARNING, "Cannot create %s: %m", newfile);
668 if (write(fd, &state, sizeof(state)) != sizeof(state)) {
670 "Failed to write state to %s", newfile);
674 if (rename(newfile, _SM_STATE_PATH) < 0) {
676 "Cannot create %s: %m", _SM_STATE_PATH);
/*
 * addr_get_port - return the port stored in a socket address, in host
 * byte order.
 *
 * addr: address to inspect; the family is read through a struct sockaddr
 *       cast.
 *
 * The port is read from sin_port or sin6_port and converted with
 * ntohs(). The case labels are not visible in this excerpt (presumably
 * AF_INET and AF_INET6), nor is the result for any other family.
 */
686 * Address handling utilities
690 addr_get_port(nsm_address *addr)
692 switch (((struct sockaddr *) addr)->sa_family) {
694 return ntohs(((struct sockaddr_in *) addr)->sin_port);
696 return ntohs(((struct sockaddr_in6 *) addr)->sin6_port);
/*
 * addr_set_port - store a port number in a socket address.
 *
 * addr: address to modify; the family is read through a struct sockaddr
 *       cast.
 * port: port in host byte order; it is converted with htons() before
 *       being written to sin_port or sin6_port.
 *
 * The case labels are not visible in this excerpt (presumably AF_INET
 * and AF_INET6).
 */
702 addr_set_port(nsm_address *addr, int port)
704 switch (((struct sockaddr *) addr)->sa_family) {
706 ((struct sockaddr_in *) addr)->sin_port = htons(port);
709 ((struct sockaddr_in6 *) addr)->sin6_port = htons(port);
/*
 * host_lookup - resolve a host name or address string with getaddrinfo().
 *
 * af:   address family placed in the hints (callers in this file pass
 *       AF_INET or AF_UNSPEC).
 * name: node name handed to getaddrinfo(); no service name is given.
 *
 * The hints are zeroed and then restricted to the requested family and
 * to IPPROTO_UDP. A non-zero getaddrinfo() result is the failure case;
 * callers in this file test the returned pointer against NULL. A list
 * stored in a host entry is later released with freeaddrinfo().
 */
713 static struct addrinfo *
714 host_lookup(int af, const char *name)
716 struct addrinfo hints, *ai;
718 memset(&hints, 0, sizeof(hints));
719 hints.ai_family = af;
720 hints.ai_protocol = IPPROTO_UDP;
722 if (getaddrinfo(name, NULL, &hints, &ai) != 0)
/*
 * nsm_log - printf-style logging helper.
 *
 * fac: syslog priority (callers pass LOG_DEBUG, LOG_WARNING, LOG_ERR).
 * fmt: format string followed by its arguments.
 *
 * LOG_DEBUG messages are dropped unless opt_debug is set. The message
 * goes either to vsyslog() or to stderr via vfprintf(); the condition
 * choosing between them is not visible in this excerpt (presumably the
 * log_syslog flag).
 */
732 nsm_log(int fac, const char *fmt, ...)
736 if (fac == LOG_DEBUG && !opt_debug)
741 vsyslog(fac, fmt, ap);
743 vfprintf(stderr, fmt, ap);
/*
 * record_pid - create the pid file and write this process's pid to it.
 *
 * The pid is formatted as decimal text followed by a newline. The file
 * /var/run/sm-notify.pid is opened with O_CREAT|O_EXCL|O_WRONLY and mode
 * 0600, so the open fails if the file already exists. The result of
 * write() is not checked.
 *
 * Returns an int; main() treats 0 as "already run". The return
 * statements themselves are not visible in this excerpt.
 */
750 * Record pid in /var/run/sm-notify.pid
751 * This file should remain until a reboot, even if the
753 * If file already exists, fail.
755 static int record_pid(void)
760 snprintf(pid, 20, "%d\n", getpid());
761 fd = open("/var/run/sm-notify.pid", O_CREAT|O_EXCL|O_WRONLY, 0600);
764 write(fd, pid, strlen(pid));
/*
 * drop_privs - switch to the uid/gid that owns the state directory.
 *
 * _SM_DIR_PATH is stat()ed first, with _SM_BASE_PATH as the fallback if
 * that fails. When the owner is uid 0 a message is logged explaining
 * that sm-notify keeps running as root and that chown-ing the directory
 * selects a different user. The group is changed with setgid() before
 * the user is changed with setuid(); a failure of either is logged as
 * "Fail to drop privileges".
 *
 * NOTE(review): what happens after each of these branches (return or
 * exit) is not visible in this excerpt.
 */
769 /* Drop privileges to match owner of state-directory
770 * (in case a reply triggers some unknown bug).
772 static void drop_privs(void)
776 if (stat(_SM_DIR_PATH, &st) == -1 &&
777 stat(_SM_BASE_PATH, &st) == -1) {
782 if (st.st_uid == 0) {
784 "sm-notify running as root. chown %s to choose different user\n",
790 if (setgid(st.st_gid) == -1
791 || setuid(st.st_uid) == -1) {
792 nsm_log(LOG_ERR, "Fail to drop privileges");
/*
 * set_kernel_nsm_state - write the NSM state number to the kernel's
 * procfs entry.
 *
 * state: value to publish; it is formatted as decimal text.
 *
 * /proc/sys/fs/nfs/nsm_local_state is opened write-only and the text is
 * written with a single write() whose result is not checked. Handling of
 * a failed open() is not visible in this excerpt.
 */
797 static void set_kernel_nsm_state(int state)
801 fd = open("/proc/sys/fs/nfs/nsm_local_state",O_WRONLY);
804 snprintf(buf, sizeof(buf), "%d", state);
805 write(fd, buf, strlen(buf));